|
| 1 | +// Licensed to the .NET Foundation under one or more agreements. |
| 2 | +// The .NET Foundation licenses this file to you under the MIT license. |
| 3 | +// See the LICENSE file in the project root for more information. |
| 4 | + |
| 5 | +using Microsoft.ML.Core.Data; |
| 6 | +using Microsoft.ML.Runtime.Model; |
| 7 | +using System.IO; |
| 8 | + |
| 9 | +namespace Microsoft.ML.Runtime.Data |
| 10 | +{ |
/// <summary>
/// A data reader that wraps another <see cref="IDataReader{TSource}"/> and passes everything it
/// reads through a chain of transformers. It can also save itself (the reader plus the chain)
/// to a stream as a model file.
/// </summary>
/// <typeparam name="TSource">The input type accepted by the underlying reader.</typeparam>
/// <typeparam name="TLastTransformer">The type of the last transformer in the chain.</typeparam>
public sealed class CompositeDataReader<TSource, TLastTransformer> : IDataReader<TSource>
    where TLastTransformer : class, ITransformer
{
    /// <summary>
    /// The wrapped data reader that produces the initial data.
    /// </summary>
    public readonly IDataReader<TSource> Reader;

    /// <summary>
    /// The transformer chain applied to the data after it is read. Never null: when no chain is
    /// supplied to the constructor, a default-constructed chain is used instead.
    /// </summary>
    public readonly TransformerChain<TLastTransformer> Transformer;

    /// <summary>
    /// Create a composite reader from an underlying reader and an optional transformer chain.
    /// </summary>
    /// <param name="reader">The underlying data reader. Checked with <c>Contracts.CheckValue</c>.</param>
    /// <param name="transformerChain">The chain to apply after reading. When null, a
    /// default-constructed <see cref="TransformerChain{TLastTransformer}"/> is used.</param>
    public CompositeDataReader(IDataReader<TSource> reader, TransformerChain<TLastTransformer> transformerChain = null)
    {
        Contracts.CheckValue(reader, nameof(reader));
        Contracts.CheckValueOrNull(transformerChain);

        // Resolve the effective chain first so that the field is assigned exactly once.
        var effectiveChain = transformerChain ?? new TransformerChain<TLastTransformer>();

        Reader = reader;
        Transformer = effectiveChain;
    }

    /// <summary>
    /// Read data from <paramref name="input"/> with the underlying reader and apply the transformer chain to it.
    /// </summary>
    /// <param name="input">The source handed to the underlying reader.</param>
    /// <returns>The output of the transformer chain applied to the data that was read.</returns>
    public IDataView Read(TSource input)
    {
        return Transformer.Transform(Reader.Read(input));
    }

    /// <summary>
    /// Get the schema of the data this composite reader produces: the underlying reader's output schema,
    /// propagated through the transformer chain.
    /// </summary>
    public ISchema GetOutputSchema()
    {
        return Transformer.GetOutputSchema(Reader.GetOutputSchema());
    }

    /// <summary>
    /// Build a new composite reader whose chain is the current chain with <paramref name="transformer"/>
    /// appended at the end. The underlying reader is reused.
    /// </summary>
    /// <typeparam name="TNewLast">The type of the appended transformer.</typeparam>
    /// <param name="transformer">The transformer to append. Checked with <c>Contracts.CheckValue</c>.</param>
    /// <returns>The new composite data reader.</returns>
    public CompositeDataReader<TSource, TNewLast> AppendTransformer<TNewLast>(TNewLast transformer)
        where TNewLast : class, ITransformer
    {
        Contracts.CheckValue(transformer, nameof(transformer));

        var extendedChain = Transformer.Append(transformer);
        return new CompositeDataReader<TSource, TNewLast>(Reader, extendedChain);
    }

    /// <summary>
    /// Save the reader and the transformer chain to a stream, as a "model file".
    /// </summary>
    /// <param name="env">The host environment used for checks and for the reporting channel.</param>
    /// <param name="outputStream">The destination stream. It must be both writable and seekable.</param>
    public void SaveTo(IHostEnvironment env, Stream outputStream)
    {
        Contracts.CheckValue(env, nameof(env));
        env.CheckValue(outputStream, nameof(outputStream));
        env.Check(outputStream.CanWrite && outputStream.CanSeek, "Need a writable and seekable stream to save");

        // The repository is declared second, so it is disposed before the channel.
        using (var channel = env.Start("Saving pipeline"))
        using (var repository = RepositoryWriter.CreateNew(outputStream, channel))
        {
            channel.Trace("Saving data reader");
            ModelSaveContext.SaveModel(repository, Reader, "Reader");

            channel.Trace("Saving transformer chain");
            ModelSaveContext.SaveModel(repository, Transformer, TransformerChain.LoaderSignature);

            repository.Commit();
        }
    }
}
| 84 | + |
/// <summary>
/// Utility class to facilitate loading a <see cref="CompositeDataReader{TSource, TLastTransformer}"/> from a stream.
/// </summary>
public static class CompositeDataReader
{
    /// <summary>
    /// Load the pipeline (a data reader followed by a transformer chain) from a stream.
    /// The two parts are read from the repository entries named "Reader" and
    /// <c>TransformerChain.LoaderSignature</c>, the same names that
    /// <see cref="CompositeDataReader{TSource, TLastTransformer}.SaveTo"/> writes.
    /// </summary>
    /// <param name="env">The host environment used for checks, model loading and the reporting channel.</param>
    /// <param name="stream">The stream to load from. It must be both readable and seekable.</param>
    /// <returns>A composite data reader built from the loaded reader and transformer chain.</returns>
    public static CompositeDataReader<IMultiStreamSource, ITransformer> LoadFrom(IHostEnvironment env, Stream stream)
    {
        Contracts.CheckValue(env, nameof(env));
        env.CheckValue(stream, nameof(stream));

        env.Check(stream.CanRead && stream.CanSeek, "Need a readable and seekable stream to load");
        using (var rep = RepositoryReader.Open(stream, env))
        using (var ch = env.Start("Loading pipeline"))
        {
            ch.Trace("Loading data reader");
            ModelLoadContext.LoadModel<IDataReader<IMultiStreamSource>, SignatureLoadModel>(env, out var reader, rep, "Reader");

            // Trace text fixed from "Loader transformer chain" to match the other progress messages.
            ch.Trace("Loading transformer chain");
            ModelLoadContext.LoadModel<TransformerChain<ITransformer>, SignatureLoadModel>(env, out var transformerChain, rep, TransformerChain.LoaderSignature);
            return new CompositeDataReader<IMultiStreamSource, ITransformer>(reader, transformerChain);
        }
    }
}
| 111 | +} |
0 commit comments