99from collections .abc import Iterator
1010from datetime import datetime , timedelta , timezone
1111from pathlib import Path , PurePosixPath
12- from unittest .mock import patch
12+ from unittest .mock import Mock , patch
1313
1414import numpy as np
1515import pandas as pd
@@ -358,15 +358,24 @@ def test_to_storage(
358358 file_type ,
359359 num_threads ,
360360):
361+ mapper = Mock (side_effect = lambda file_path : len (file_path ))
362+
361363 ctc = cloud_test_catalog
362364 df = dc .read_storage (ctc .src_uri , type = file_type , session = test_session )
363365 if use_map :
364- df .settings (cache = use_cache ).map (
365- res = lambda file : file .export (tmp_dir / "output" , placement = placement )
366- ).exec ()
366+ (
367+ df .settings (cache = use_cache )
368+ .map (mapper , params = ["file.path" ], output = {"path_len" : int })
369+ .map (res = lambda file : file .export (tmp_dir / "output" , placement = placement ))
370+ .exec ()
371+ )
367372 else :
368- df .settings (cache = use_cache ).to_storage (
369- tmp_dir / "output" , placement = placement , num_threads = num_threads
373+ (
374+ df .settings (cache = use_cache )
375+ .map (mapper , params = ["file.path" ], output = {"path_len" : int })
376+ .to_storage (
377+ tmp_dir / "output" , placement = placement , num_threads = num_threads
378+ )
370379 )
371380
372381 expected = {
@@ -387,6 +396,8 @@ def test_to_storage(
387396 with open (tmp_dir / "output" / file_path ) as f :
388397 assert f .read () == expected [file .name ]
389398
399+ assert mapper .call_count == len (expected )
400+
390401
391402@pytest .mark .parametrize ("use_cache" , [True , False ])
392403def test_export_images_files (test_session , tmp_dir , tmp_path , use_cache ):
0 commit comments