|  | 
|  | 1 | +// Licensed to the Apache Software Foundation (ASF) under one | 
|  | 2 | +// or more contributor license agreements.  See the NOTICE file | 
|  | 3 | +// distributed with this work for additional information | 
|  | 4 | +// regarding copyright ownership.  The ASF licenses this file | 
|  | 5 | +// to you under the Apache License, Version 2.0 (the | 
|  | 6 | +// "License"); you may not use this file except in compliance | 
|  | 7 | +// with the License.  You may obtain a copy of the License at | 
|  | 8 | +// | 
|  | 9 | +//   http://www.apache.org/licenses/LICENSE-2.0 | 
|  | 10 | +// | 
|  | 11 | +// Unless required by applicable law or agreed to in writing, | 
|  | 12 | +// software distributed under the License is distributed on an | 
|  | 13 | +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | 
|  | 14 | +// KIND, either express or implied.  See the License for the | 
|  | 15 | +// specific language governing permissions and limitations | 
|  | 16 | +// under the License. | 
|  | 17 | + | 
|  | 18 | +use crate::io::{FileRead, InputFile}; | 
|  | 19 | +use crate::puffin::blob::Blob; | 
|  | 20 | +use crate::puffin::metadata::{BlobMetadata, FileMetadata}; | 
|  | 21 | +use crate::Result; | 
|  | 22 | + | 
|  | 23 | +/// Puffin reader | 
|  | 24 | +pub(crate) struct PuffinReader { | 
|  | 25 | +    input_file: InputFile, | 
|  | 26 | +    file_metadata: Option<FileMetadata>, | 
|  | 27 | +} | 
|  | 28 | + | 
|  | 29 | +impl PuffinReader { | 
|  | 30 | +    /// Returns a new Puffin reader | 
|  | 31 | +    pub(crate) fn new(input_file: InputFile) -> Self { | 
|  | 32 | +        Self { | 
|  | 33 | +            input_file, | 
|  | 34 | +            file_metadata: None, | 
|  | 35 | +        } | 
|  | 36 | +    } | 
|  | 37 | + | 
|  | 38 | +    /// Returns file metadata | 
|  | 39 | +    pub(crate) async fn file_metadata(&mut self) -> Result<&FileMetadata> { | 
|  | 40 | +        if let Some(ref file_metadata) = self.file_metadata { | 
|  | 41 | +            Ok(file_metadata) | 
|  | 42 | +        } else { | 
|  | 43 | +            let file_metadata = FileMetadata::read(&self.input_file).await?; | 
|  | 44 | +            Ok(self.file_metadata.insert(file_metadata)) | 
|  | 45 | +        } | 
|  | 46 | +    } | 
|  | 47 | + | 
|  | 48 | +    /// Returns blob | 
|  | 49 | +    pub(crate) async fn blob(&self, blob_metadata: BlobMetadata) -> Result<Blob> { | 
|  | 50 | +        let file_read = self.input_file.reader().await?; | 
|  | 51 | +        let start = blob_metadata.offset; | 
|  | 52 | +        let end = start + blob_metadata.length; | 
|  | 53 | +        let bytes = file_read.read(start..end).await?.to_vec(); | 
|  | 54 | +        let data = blob_metadata.compression_codec.decompress(bytes)?; | 
|  | 55 | + | 
|  | 56 | +        Ok(Blob { | 
|  | 57 | +            r#type: blob_metadata.r#type, | 
|  | 58 | +            fields: blob_metadata.fields, | 
|  | 59 | +            snapshot_id: blob_metadata.snapshot_id, | 
|  | 60 | +            sequence_number: blob_metadata.sequence_number, | 
|  | 61 | +            data, | 
|  | 62 | +            properties: blob_metadata.properties, | 
|  | 63 | +        }) | 
|  | 64 | +    } | 
|  | 65 | +} | 
|  | 66 | + | 
#[cfg(test)]
mod tests {

    use crate::puffin::reader::PuffinReader;
    use crate::puffin::test_utils::{
        blob_0, blob_1, java_uncompressed_metric_input_file,
        java_zstd_compressed_metric_input_file, uncompressed_metric_file_metadata,
        zstd_compressed_metric_file_metadata,
    };

    /// Reads the fixture from `java_uncompressed_metric_input_file` and checks
    /// that its metadata and its first two blobs match the expected values.
    #[tokio::test]
    async fn test_puffin_reader_uncompressed_metric_data() {
        let mut reader = PuffinReader::new(java_uncompressed_metric_input_file());

        // Clone the metadata so the mutable borrow of `reader` ends before
        // the blobs are read.
        let metadata = reader.file_metadata().await.unwrap().clone();
        assert_eq!(metadata, uncompressed_metric_file_metadata());

        let first_blob_metadata = metadata.blobs.first().unwrap().clone();
        let first_blob = reader.blob(first_blob_metadata).await.unwrap();
        assert_eq!(first_blob, blob_0());

        let second_blob_metadata = metadata.blobs.get(1).unwrap().clone();
        let second_blob = reader.blob(second_blob_metadata).await.unwrap();
        assert_eq!(second_blob, blob_1());
    }

    /// Reads the fixture from `java_zstd_compressed_metric_input_file` and
    /// checks that its metadata and its first two blobs match the expected
    /// values.
    #[tokio::test]
    async fn test_puffin_reader_zstd_compressed_metric_data() {
        let mut reader = PuffinReader::new(java_zstd_compressed_metric_input_file());

        // Clone the metadata so the mutable borrow of `reader` ends before
        // the blobs are read.
        let metadata = reader.file_metadata().await.unwrap().clone();
        assert_eq!(metadata, zstd_compressed_metric_file_metadata());

        let first_blob_metadata = metadata.blobs.first().unwrap().clone();
        let first_blob = reader.blob(first_blob_metadata).await.unwrap();
        assert_eq!(first_blob, blob_0());

        let second_blob_metadata = metadata.blobs.get(1).unwrap().clone();
        let second_blob = reader.blob(second_blob_metadata).await.unwrap();
        assert_eq!(second_blob, blob_1());
    }
}
0 commit comments