You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

96 lines
2.9 KiB

Imports System.IO
Imports System.Runtime.CompilerServices
Imports Microsoft.VisualBasic.Data.IO
Imports Microsoft.VisualBasic.Language
Imports Microsoft.VisualBasic.Linq
Imports Microsoft.VisualBasic.Math.LinearAlgebra
Imports Microsoft.VisualBasic.Net.Http
''' <summary>
''' Binary save/load helpers for <see cref="Vector"/>. The values are cut into
''' chunks, every chunk is gzip-compressed on its own, and an offset/size index
''' is stored in front of the compressed payload.
''' </summary>
''' <remarks>
''' Layout, in the order <see cref="Serialize"/> writes it:
'''
'''   chunkSize   Int32   the chunk size that was requested (kept for validation)
'''   chunks      Int32   number of compressed chunks
'''   index       one (offset Int64, size Int64) pair per chunk
'''   payload     the gzip-compressed chunks, back to back
'''
''' Offsets are counted from the first byte of the header, i.e. the first
''' payload chunk starts at 8 + 16 * chunks.
''' </remarks>
Public Module VectorIOExtensions

    ''' <summary>Bytes taken by the two Int32 header fields (chunk size + chunk count).</summary>
    Private Const HeaderSize As Long = 4 + 4

    ''' <summary>Bytes taken by one index entry (Int64 offset + Int64 size).</summary>
    Private Const IndexEntrySize As Long = 8 + 8

    ''' <summary>Bytes taken by one serialized <see cref="Double"/>.</summary>
    Private Const DoubleSize As Integer = 8

    ''' <summary>
    ''' Writes <paramref name="vec"/> to <paramref name="save"/> as a chunked,
    ''' gzip-compressed binary block.
    ''' </summary>
    ''' <param name="vec">The vector whose <c>Array</c> values are written.</param>
    ''' <param name="save">
    ''' Destination stream. It is flushed through the writer but neither closed
    ''' nor disposed by this method.
    ''' </param>
    ''' <param name="chunkSize">
    ''' Value handed to <c>Split</c> to cut the data into chunks; it is also
    ''' stored as the first header field. Must be positive.
    ''' </param>
    ''' <exception cref="ArgumentNullException">
    ''' <paramref name="vec"/> or <paramref name="save"/> is Nothing.
    ''' </exception>
    ''' <exception cref="ArgumentOutOfRangeException">
    ''' <paramref name="chunkSize"/> is zero or negative.
    ''' </exception>
    <Extension>
    Public Sub Serialize(vec As Vector, save As Stream, Optional chunkSize% = 1024)
        If vec Is Nothing Then
            Throw New ArgumentNullException(NameOf(vec))
        End If
        If save Is Nothing Then
            Throw New ArgumentNullException(NameOf(save))
        End If
        If chunkSize <= 0 Then
            Throw New ArgumentOutOfRangeException(NameOf(chunkSize), chunkSize, "The chunk size must be a positive number.")
        End If

        Dim buffers As New List(Of MemoryStream)

        Try
            ' Every chunk has to be compressed before anything is written,
            ' because the index in front of the payload needs the compressed sizes.
            For Each chunk As Double() In vec.Array.Split(chunkSize)
                Dim bytes As Byte() = chunk _
                    .Select(AddressOf BitConverter.GetBytes) _
                    .IteratesALL _
                    .ToArray

                ' gzip-compress this single chunk
                buffers += New MemoryStream(bytes).GZipStream
            Next

            Dim writer As New BinaryDataWriter(save)

            writer.Write(chunkSize)
            writer.Write(buffers.Count)

            ' The first payload byte sits right behind the header and the index.
            Dim offset As Long = HeaderSize + IndexEntrySize * buffers.Count

            For Each block As MemoryStream In buffers
                Call writer.Write(offset)
                Call writer.Write(block.Length)

                offset += block.Length
            Next

            For Each block As MemoryStream In buffers
                Call writer.Write(block)
            Next

            Call writer.Flush()
        Finally
            ' The compressed buffers are only temporaries; release them even
            ' when writing fails half way.
            For Each block As MemoryStream In buffers
                Call block.Dispose()
            Next
        End Try
    End Sub

    ''' <summary>
    ''' Reads back a vector from the layout produced by <see cref="Serialize"/>.
    ''' </summary>
    ''' <param name="reads">
    ''' Source stream, positioned at the first header byte. All seeks are
    ''' relative, so the block does not have to start at stream position 0.
    ''' </param>
    ''' <returns>A new vector holding all decoded values in chunk order.</returns>
    ''' <exception cref="ArgumentNullException"><paramref name="reads"/> is Nothing.</exception>
    ''' <exception cref="InvalidDataException">
    ''' The header declares a negative chunk count, or an index entry declares
    ''' a size that is negative or larger than <see cref="Integer.MaxValue"/>.
    ''' </exception>
    <Extension>
    Public Function LoadVector(reads As Stream) As Vector
        If reads Is Nothing Then
            Throw New ArgumentNullException(NameOf(reads))
        End If

        Dim data As New List(Of Double)

        ' NOTE(review): disposing the reader presumably also closes `reads`;
        ' confirm against BinaryDataReader before reusing the stream afterwards.
        Using reader As New BinaryDataReader(reads)
            ' First header field: the chunk size used by the writer. Decoding
            ' does not need it, it only has to be skipped.
            Call reader.ReadInt32()

            Dim chunks As Integer = reader.ReadInt32

            If chunks < 0 Then
                Throw New InvalidDataException($"Invalid vector header: negative chunk count ({chunks}).")
            End If

            For i As Integer = 0 To chunks - 1
                Dim offset As Long = reader.ReadInt64
                Dim size As Long = reader.ReadInt64

                If size < 0 OrElse size > Integer.MaxValue Then
                    Throw New InvalidDataException($"Invalid size ({size}) in index entry #{i}.")
                End If

                ' Remember where the next index entry starts
                ' (presumably Reset() below returns to this position).
                reader.Mark()

                ' Header plus (i + 1) index entries have been consumed so far:
                ' step back by exactly that much to the start of the block ...
                reader.Seek(-(HeaderSize + IndexEntrySize * (i + 1)), SeekOrigin.Current)
                ' ... and from there jump forward to this chunk's payload.
                reader.Seek(offset, SeekOrigin.Current)

                ' Read the gzip data of this chunk and decompress it.
                Using buffer As MemoryStream = reader.ReadBytes(CInt(size)).UnGzipStream
                    ' Turn every group of 8 bytes back into a Double.
                    data += buffer.ToArray _
                        .Split(DoubleSize) _
                        .Select(Function(block)
                                    Return BitConverter.ToDouble(block, Scan0)
                                End Function)
                End Using

                reader.Reset()
            Next
        End Using

        Return New Vector(data)
    End Function
End Module