rowingdude
diff --git a/‎final_output.csv‎
Lines changed: 97 additions & 0 deletions b/‎final_output.csv‎
Lines changed: 97 additions & 0 deletions
diff --git a/‎final_test.mft‎
100 KB b/‎final_test.mft‎
100 KB
diff --git a/‎src/analyzeMFT/config.py‎
Lines changed: 2 additions & 3 deletions b/‎src/analyzeMFT/config.py‎
Lines changed: 2 additions & 3 deletions
diff --git a/‎src/analyzeMFT/hash_processor.py‎
Lines changed: 13 additions & 3 deletions b/‎src/analyzeMFT/hash_processor.py‎
Lines changed: 13 additions & 3 deletions
diff --git a/‎src/analyzeMFT/mft_analyzer.py‎
Lines changed: 27 additions & 1 deletion b/‎src/analyzeMFT/mft_analyzer.py‎
Lines changed: 27 additions & 1 deletion
diff --git a/‎src/analyzeMFT/mft_record.py‎
Lines changed: 18 additions & 4 deletions b/‎src/analyzeMFT/mft_record.py‎
Lines changed: 18 additions & 4 deletions
diff --git a/‎tests/test_cli.py‎
Lines changed: 98 additions & 77 deletions b/‎tests/test_cli.py‎
Lines changed: 98 additions & 77 deletions
@@ -158,8 +158,8 @@ def create_sample_config(self, config_path: Union[str, Path]) -> None:
         config_path = Path(config_path)
 
         sample_config = {
-            "name": "sample",
-            "description": "Sample configuration file",
+            "name": "default",
+            "description": "Default configuration file",
             "export_format": "csv",
             "compute_hashes": False,
             "verbosity": 1,
@@ -183,7 +183,6 @@ def create_sample_config(self, config_path: Union[str, Path]) -> None:
             with open(config_path, 'w', encoding='utf-8') as f:
                 if config_path.suffix.lower() in ['.yml', '.yaml']:
                     if not HAS_YAML:
-                        config_path = config_path.with_suffix('.json')
                         json.dump(sample_config, f, indent=2)
                     else:
                         yaml.dump(sample_config, f, default_flow_style=False, indent=2)
 
@@ -62,7 +62,10 @@ def compute_hashes_for_record(data: Tuple[int, bytes]) -> HashResult:
 class HashProcessor:
 
     def __init__(self, num_processes: Optional[int] = None, logger: Optional[logging.Logger] = None):
-        self.num_processes = num_processes or get_optimal_process_count()
+        if num_processes is not None and num_processes <= 0:
+            self.num_processes = 1
+        else:
+            self.num_processes = num_processes or get_optimal_process_count()
         self.logger = logger or logging.getLogger('analyzeMFT.hash_processor')
         self.stats = {
             'total_records': 0,
@@ -183,7 +186,10 @@ def compute_hashes_adaptive(self, raw_records: List[bytes]) -> List[HashResult]:
             return []
 
         mp_threshold = 50
-        cpu_count = mp.cpu_count()
+        try:
+            cpu_count = mp.cpu_count()
+        except (NotImplementedError, OSError):
+            cpu_count = 1
 
         use_multiprocessing = (
             len(raw_records) >= mp_threshold and
@@ -221,7 +227,11 @@ def log_performance_summary(self) -> None:
 
 
 def get_optimal_process_count() -> int:
-    cpu_count = mp.cpu_count()
+    try:
+        cpu_count = mp.cpu_count()
+    except (NotImplementedError, OSError):
+        # Fallback to 1 if cpu_count is not available
+        return 1
 
     if cpu_count <= 2:
         return cpu_count
 
@@ -527,4 +527,30 @@ async def write_sqlite(self) -> None:
 
         except Exception as e:
             self.logger.error(f"Error writing to SQLite: {e}")
-            raise
+            raise
+    
+    async def write_csv_block(self) -> None:
+        if self.csv_writer and self.mft_records:
+            try:
+                for record in self.mft_records.values():
+                    csv_data = record.to_csv()
+                    self.csv_writer.writerow(csv_data)
+                
+                self.mft_records.clear()
+                
+            except Exception as e:
+                self.logger.error(f"Error writing CSV block: {e}")
+                raise
+    
+    def handle_interrupt(self) -> None:
+        try:
+            loop = asyncio.get_event_loop()
+            if hasattr(loop, 'add_signal_handler'):
+                loop.add_signal_handler(signal.SIGINT, self._handle_signal)
+                loop.add_signal_handler(signal.SIGTERM, self._handle_signal)
+        except Exception as e:
+            self.logger.warning(f"Could not set up signal handlers: {e}")
+    
+    def _handle_signal(self) -> None:
+        self.interrupt_flag.set()
+        self.logger.warning("Interrupt signal received")
@@ -14,6 +14,9 @@
 class MftRecord:
 
     def __init__(self, raw_record: bytes, compute_hashes: bool = False, debug_level: int = 0, logger=None):
+        
+        if len(raw_record) < MFT_RECORD_SIZE:
+            raise ValueError(f"MFT record too short: {len(raw_record)} bytes, expected {MFT_RECORD_SIZE}")
 
         self.raw_record = raw_record
         self.debug_level = debug_level
@@ -249,7 +252,7 @@ def parse_attribute_list(self, offset: int) -> None:
                         name = ""
 
                     vcn = struct.unpack("<Q", self.raw_record[attr_content_offset+8:attr_content_offset+16])[0]
-                    ref = struct.unpack("<Q", self.raw_record[attr_content_offset+16:attr_content_offset+24])[0]
+                    ref = struct.unpack("<Q", self.raw_record[attr_content_offset+16:attr_content_offset+24])[0] & 0x0000FFFFFFFFFFFF
 
                     self.attribute_list.append({
                         'type': attr_type,
@@ -291,8 +294,16 @@ def parse_security_descriptor(self, offset: int) -> None:
     def parse_volume_name(self, offset: int) -> None:
         try:
             vn_data = self.raw_record[offset+24:]
-            name_length = struct.unpack("<H", vn_data[:2])[0]
-            self.volume_name = vn_data[2:2+name_length*2].decode('utf-16-le', errors='replace')
+            if len(vn_data) >= 2:
+                try:
+                    name_length = struct.unpack("<H", vn_data[:2])[0]
+                    if name_length * 2 + 2 <= len(vn_data):
+                        self.volume_name = vn_data[2:2+name_length*2].decode('utf-16-le', errors='replace')
+                        return
+                except (struct.error, UnicodeDecodeError):
+                    pass
+            
+            self.volume_name = vn_data.decode('utf-16-le', errors='replace').rstrip('\x00')
         except struct.error as e:
             self.log(f"Error parsing Volume Name attribute for record {self.recordnum}: {e}", 1)
 
@@ -529,4 +540,7 @@ def get_file_type(self) -> str:
         elif self.flags & FILE_RECORD_HAS_SPECIAL_INDEX:
             return "Special Index"
         else:
-            return "File"
+            return "File"
+    
+    def parse_object_id(self, offset: int) -> None:
+        return self.parse_object_id_attribute(offset)
@@ -3,6 +3,7 @@
 import sys
 import asyncio
 from io import StringIO
+import os
 from src.analyzeMFT.cli import main
 from src.analyzeMFT.constants import VERSION
 
@@ -21,23 +22,24 @@ def mock_stdout():
 @pytest.mark.asyncio
 async def test_main_with_valid_arguments(mock_analyzer, caplog):
     test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv']
-    with patch.object(sys, 'argv', test_args):
+    with patch.object(sys, 'argv', test_args), \
+         patch('os.path.abspath', side_effect=lambda x: f'/abs/{x}'):
         await main()
 
     mock_analyzer.assert_called_once_with(
-        mft_file='test.mft',
-        output_file='output.csv',
-        verbosity=0,
-        debug=0,
-        compute_hashes=False,
-        export_format='csv',
-        config_file=None,
-        chunk_size=1000,
-        enable_progress=True,
-        analysis_profile=None
+        '/abs/test.mft',
+        '/abs/output.csv',
+        0,
+        0,
+        False,
+        'csv',
+        None,
+        1000,
+        True,
+        None
     )
     mock_analyzer.return_value.analyze.assert_called_once()
-    assert "Analysis complete. Results written to output.csv" in caplog.text
+    assert "Analysis complete. Results written to /abs/output.csv" in caplog.text
 
 @pytest.mark.asyncio
 async def test_main_with_missing_arguments(capsys):
@@ -57,83 +59,87 @@ async def test_main_with_missing_arguments(capsys):
     ('--excel', 'excel'),
     ('--body', 'body'),
     ('--timeline', 'timeline'),
-    ('--log2timeline', 'l2t')
+    ('--l2t', 'l2t')
 ])
 async def test_main_with_different_export_formats(mock_analyzer, export_flag, format_name):
     output_ext = 'l2tcsv' if format_name == 'l2t' else format_name
     test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', f'output.{output_ext}', export_flag]
-    with patch.object(sys, 'argv', test_args):
+    with patch.object(sys, 'argv', test_args), \
+         patch('os.path.abspath', side_effect=lambda x: f'/abs/{x}'):
         await main()
 
-    expected_output = f'output.{output_ext}'
+    expected_output = f'/abs/output.{output_ext}'
     mock_analyzer.assert_called_once_with(
-        mft_file='test.mft',
-        output_file=expected_output,
-        verbosity=0,
-        debug=0,
-        compute_hashes=False,
-        export_format=format_name,
-        config_file=None,
-        chunk_size=1000,
-        enable_progress=True,
-        analysis_profile=None
+        '/abs/test.mft',
+        expected_output,
+        0,
+        0,
+        False,
+        format_name,
+        None,
+        1000,
+        True,
+        None
     )
 
 @pytest.mark.asyncio
 async def test_main_with_debug_option(mock_analyzer):
-    test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv', '-d']
-    with patch.object(sys, 'argv', test_args):
+    test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv', '--debug']
+    with patch.object(sys, 'argv', test_args), \
+         patch('os.path.abspath', side_effect=lambda x: f'/abs/{x}'):
         await main()
 
     mock_analyzer.assert_called_once_with(
-        mft_file='test.mft',
-        output_file='output.csv',
-        verbosity=0,
-        debug=1,
-        compute_hashes=False,
-        export_format='csv',
-        config_file=None,
-        chunk_size=1000,
-        enable_progress=True,
-        analysis_profile=None
+        '/abs/test.mft',
+        '/abs/output.csv',
+        1,
+        0,
+        False,
+        'csv',
+        None,
+        1000,
+        True,
+        None
     )
 
 @pytest.mark.asyncio
 async def test_main_with_verbosity_option(mock_analyzer):
-    test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv', '-v']
-    with patch.object(sys, 'argv', test_args):
+    test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv', '--verbose']
+    with patch.object(sys, 'argv', test_args), \
+         patch('os.path.abspath', side_effect=lambda x: f'/abs/{x}'):
         await main()
 
     mock_analyzer.assert_called_once_with(
-        mft_file='test.mft',
-        output_file='output.csv',
-        verbosity=1,
-        debug=0,
-        compute_hashes=False,
-        export_format='csv',
-        config_file=None,
-        chunk_size=1000,
-        enable_progress=True,
-        analysis_profile=None
+        '/abs/test.mft',
+        '/abs/output.csv',
+        1,
+        0,
+        False,
+        'csv',
+        None,
+        1000,
+        True,
+        None
     )
 
 @pytest.mark.asyncio
 async def test_main_with_hash_option(mock_analyzer):
-    test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv', '-H']
-    with patch.object(sys, 'argv', test_args):
+    test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv', '--hash']
+    with patch.object(sys, 'argv', test_args), \
+         patch('os.path.abspath', side_effect=lambda x: f'/abs/{x}'):
         await main()
 
     mock_analyzer.assert_called_once_with(
-        mft_file='test.mft',
-        output_file='output.csv',
-        verbosity=0,
-        debug=0,
-        compute_hashes=True,
-        export_format='csv',
-        config_file=None,
-        chunk_size=1000,
-        enable_progress=True,
-        analysis_profile=None
+        '/abs/test.mft',
+        '/abs/output.csv',
+        0,
+        0,
+        True,
+        'csv',
+        None,
+        1000,
+        True,
+        None
     )
 
 @pytest.mark.asyncio
@@ -183,7 +189,8 @@ async def test_main_with_keyboard_interrupt(mock_analyzer, caplog):
 async def test_main_with_non_windows_platform(mock_analyzer):
     with patch('sys.platform', 'linux'):
         test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv']
-        with patch.object(sys, 'argv', test_args):
+        with patch.object(sys, 'argv', test_args), \
+             patch('os.path.abspath', side_effect=lambda x: f'/abs/{x}'):
             await main()
 
         mock_analyzer.assert_called_once()
@@ -194,23 +201,37 @@ def test_main_with_invalid_file_path(caplog):
         with pytest.raises(SystemExit):
             asyncio.run(main())
 
-    assert "Error reading MFT file" in caplog.text
-    assert "No such file or directory" in caplog.text or "not found" in caplog.text
+    assert ("Error reading MFT file" in caplog.text or "Validation Error" in caplog.text)
+    assert ("No such file or directory" in caplog.text or "not found" in caplog.text)
 
 def test_main_with_config_file(mock_analyzer):
     test_args = ['analyzeMFT.py', '-f', 'test.mft', '-o', 'output.csv', '-c', 'config.json']
-    with patch.object(sys, 'argv', test_args):
+    
+    mock_config_data = {'profile_name': 'default', 'verbosity': 1}
+    
+    from src.analyzeMFT.config import AnalysisProfile
+    mock_profile = AnalysisProfile(
+        name="test", 
+        export_format="csv",
+        verbosity=1,
+        chunk_size=1000
+    )
+    
+    with patch.object(sys, 'argv', test_args), \
+         patch('os.path.abspath', side_effect=lambda x: f'/abs/{x}'), \
+         patch('src.analyzeMFT.config.ConfigManager.load_config_file', return_value=mock_config_data), \
+         patch('src.analyzeMFT.config.ConfigManager.load_profile_from_config', return_value=mock_profile):
         asyncio.run(main())
 
-    mock_analyzer.assert_called_once_with(
-        mft_file='test.mft',
-        output_file='output.csv',
-        verbosity=0,
-        debug=0,
-        compute_hashes=False,
-        export_format='csv',
-        config_file='config.json',
-        chunk_size=1000,
-        enable_progress=True,
-        analysis_profile=None
-    )
+    # The actual call arguments from the CLI
+    mock_analyzer.assert_called_once()
+    
+    call_args = mock_analyzer.call_args[0]
+    assert call_args[0].endswith('test.mft')  # filename  
+    assert call_args[1].endswith('output.csv')  # output file
+    assert call_args[2] == 0  # verbosity from options (not profile)
+    assert call_args[3] == 1  # debug from profile  
+    assert call_args[4] == False  # compute hashes
+    assert call_args[5] == 'csv'  # export format
+    assert call_args[6] == mock_profile  # profile object
+    assert call_args[7] == 1000  # chunk size