繁体   English   中英

无法将PostgreSQL中的文件作为大对象存储并读取

[英]Can't store and then read Files in PostgreSQL as large objects

我正在尝试使用NpgSQL v3.0.4.0向PostgreSQL数据库V9.4.x写入和读取大对象,因此我制定了一种将本地文件作为大对象存储在数据库中的方法,如下所示:

public static async Task<uint> InsertLargeObjectFileToDB(string theFilePath)
{
     // connecting to DB
     string connstring = MakeDatabaseConnectionString();
     // make a connection object
     NpgsqlConnection Conn = new NpgsqlConnection(connstring);
     try
     {
        await OpenDatabaseConnection(Conn); //open database connection
     }
     catch (Exception Ex)
     {
        throw (Ex);
     }

     uint oid; // to store object ID number
     try
     {
        // Reading and writing Large Objects requires the use of a transaction

        using (FileStream fs = new FileStream(theFilePath, FileMode.Open))
        {
           using (var transaction = Conn.BeginTransaction())
           {
              // Retrieve a Large Object Manager for this connection
              var manager = new NpgsqlLargeObjectManager(Conn);
              // Create a new empty file, returning the identifier to later access it
              oid = manager.Create();

              using (var DbStream = manager.OpenReadWrite(oid))
              {
                 long theFileSize = GetFileSizeInBytes(theFilePath);
                 StreamReader sr = new StreamReader(fs);
                 byte[] buffer = new byte[1024 * 1024];

                 while (sr.BaseStream.Position < theFileSize)
                 {
                    await fs.ReadAsync(buffer, 0, buffer.Length);
                    await DbStream.WriteAsync(buffer, 0, buffer.Length);
                 }
              }
              transaction.Commit();
              return oid;
           }
        }
     }
     catch // any error
     {
        // exception
        Exception ex = new Exception();
        ex.Data.Add(ex.Data.Count, "some error message");
        throw ex;
     }
}

然后,我制作了一种方法来读取大对象并将其存储在temp目录中的随机命名文件中,如下所示:

public static async Task<string> GetLargeObjectFileFromDB(uint oid)
{
     // connecting to DB
     string connstring = MakeDatabaseConnectionString();
     // make a connection object
     NpgsqlConnection Conn = new NpgsqlConnection(connstring);
     try
     {
        await OpenDatabaseConnection(Conn); //open database connection
     }
     catch (Exception Ex)
     {
        throw (Ex);
     }

     // getting a temorary file name from the system to use it to store the fetched file
     string TempFileName = GetRandomFileNameFromSystem();

     try
     {
        using (FileStream LocalStream = new FileStream(TempFileName, FileMode.Create))
        {
           using (var transaction = Conn.BeginTransaction())
           {
              // create a Large Object Manager for this connection
              var DbLargeObjectManager = new NpgsqlLargeObjectManager(Conn);

              using (var DbStream = await DbLargeObjectManager.OpenReadAsync(oid))
              {
                 byte[] buffer = new byte[1024 * 1024];
                 // get the length of the database object
                 long LengthOfDbObject = DbStream.Length;

                 while (DbStream.Position < LengthOfDbObject)
                 {
                    // read from the database to buffer
                    await DbStream.ReadAsync(buffer, 0, buffer.Length);
                    //write from buffer to local file
                    await LocalStream.WriteAsync(buffer, 0, buffer.Length);
                 }
              }
              transaction.Commit();
              return TempFileName;
           }
        }
     }
     catch // any error
     {
        // exception
        Exception ex = new Exception();
        ex.Data.Add(ex.Data.Count, "Error inserting object in database");
        throw ex;
     }
 }

如您所见,我一直在异步编写。 问题是我对这2种方法进行了测试,并且此测试将6MB文件写入数据库,但是当我再次从数据库中读取该文件时,文件大约大了400 kb,(当然)MD5哈希不匹配。 不要忘了说,没有例外发生过。 如果您关心的话,这是测试:

private async void button3_Click(object sender, EventArgs e)
  {
     listBox1.Items.Clear();

     // getting the MD5 hash of the source file
     string FirstMd5Hash = GetMd5OfFile(tbSourceFile.Text);

     // performance measurment ##########################################
     DateTime dt1 = new DateTime(DateTime.Now.Ticks);
     listBox1.Items.Add("Uploading file to database");
     //storing that file into database
     uint oid = await InsertLargeObjectFileToDB(tbSourceFile.Text);

     // performance measurment #########################################################
     DateTime dt2 = new DateTime(DateTime.Now.Ticks);
     TimeSpan ts = new TimeSpan(dt2.Ticks - dt1.Ticks);
     listBox1.Items.Add("Large object (oid = " + oid + ") inserted in " + ts.Seconds + "." + ts.Milliseconds + " seconds");

     // performance measurment ##########################################
     dt1 = new DateTime(DateTime.Now.Ticks);
     listBox1.Items.Add("reading file back from the database");
     // get that object back from the database into temporary file
     string ReturnedFileName = await PostgresqlLargeObject.GetLargeObjectFileFromDB(oid);
     // performance measurment #########################################################
     dt2 = new DateTime(DateTime.Now.Ticks);
     ts = new TimeSpan(dt2.Ticks - dt1.Ticks);
     listBox1.Items.Add("reading done in " + ts.Seconds + "." + ts.Milliseconds + " seconds");


     //calculate md5 of that file
     string SecondMd5Hash = GetMd5OfFile(ReturnedFileName);

     // compare the 2 hashes
     if (FirstMd5Hash == SecondMd5Hash)
     {
        listBox1.Items.Add("the hashes are match . MD5 = " + FirstMd5Hash);
     }
     else
     {
        listBox1.Items.Add("failed with oid = " + oid);
        tbFileBack.Text = ReturnedFileName;
     }
 }

怎么了?

好的,我已经解决了这个问题,事实证明(除了考虑Emil的答案),您还必须异步读取然后同步写入。 我不知道为什么。 此代码的工作原理:

using (FileStream LocalStream = new FileStream(TempFileName, FileMode.Create))
            {
               using (var transaction = Conn.BeginTransaction())
               {
                  // create a Large Object Manager for this connection
                  var DbLargeObjectManager = new NpgsqlLargeObjectManager(Conn);

                  using (var DbStream = await DbLargeObjectManager.OpenReadAsync(oid))
                  {
                     byte[] buffer = new byte[262144]; //256KB
                     // query the database stream length
                     long DatabaseStreamLength = DbStream.Length;
                     while (DbStream.Position < DatabaseStreamLength)
                     {
                        // read from the database to buffer (async)
                        int bufferByteCount = await DbStream.ReadAsync(buffer, 0, buffer.Length);
                        //write from buffer to local file (sync)
                        LocalStream.Write(buffer, 0, bufferByteCount);
                     }
                  }
                  transaction.Commit();

当执行await <stream>.WriteAsync(buffer, 0, buffer.Length); 您应该写入由上一个read方法实际读取的字节数(将返回该值)。

暂无
暂无

声明:本站的技术帖子网页,遵循CC BY-SA 4.0协议,如果您需要转载,请注明本站网址或者原文地址。任何问题请咨询:yoyou2525@163.com.

 
粤ICP备18138465号  © 2020-2024 STACKOOM.COM