@@ -1307,8 +1307,8 @@ async def test_parser_only_reader(pdf_parser: PDFParserFn, stub_data_dir: Path)
13071307 parse_pdf = pdf_parser ,
13081308 full_page = True , # Simple to support across many parsers
13091309 )
1310- assert parsed_text .metadata .summary
1311- assert "pdf" in parsed_text .metadata .summary
1310+ assert parsed_text .metadata .name
1311+ assert "pdf" in parsed_text .metadata .name
13121312 assert parsed_text .metadata .chunk_metadata is None
13131313 assert isinstance (parsed_text .content , dict )
13141314 num_chars = 0
@@ -1339,11 +1339,11 @@ async def test_chunk_metadata_reader(
13391339 include_metadata = True ,
13401340 parse_pdf = pdf_parser ,
13411341 )
1342- assert metadata .summary
1343- assert "pdf" in metadata .summary
1342+ assert metadata .name
1343+ assert "pdf" in metadata .name
13441344 assert isinstance (metadata .chunk_metadata , ChunkMetadata )
1345- assert metadata .chunk_metadata .summary
1346- assert "overlap-pdf" in metadata .chunk_metadata .summary
1345+ assert metadata .chunk_metadata .name
1346+ assert "overlap-pdf" in metadata .chunk_metadata .name
13471347 assert metadata .chunk_metadata .overlap == 100
13481348 assert metadata .chunk_metadata .size == 3000
13491349 assert len (chunk_text ) > 2 , "Expected multiple chunks, for meaningful assertions"
@@ -1380,11 +1380,11 @@ async def test_chunk_metadata_reader(
13801380 include_metadata = True ,
13811381 )
13821382 # NOTE the use of tiktoken changes the actual char and overlap counts
1383- assert metadata .summary
1384- assert "html" in metadata .summary
1383+ assert metadata .name
1384+ assert "html" in metadata .name
13851385 assert isinstance (metadata .chunk_metadata , ChunkMetadata )
1386- assert metadata .chunk_metadata .summary
1387- assert "overlap-text" in metadata .chunk_metadata .summary
1386+ assert metadata .chunk_metadata .name
1387+ assert "overlap-text" in metadata .chunk_metadata .name
13881388 assert metadata .chunk_metadata .overlap == 100
13891389 assert metadata .chunk_metadata .size == 3000
13901390 assert all (
@@ -1404,11 +1404,11 @@ async def test_chunk_metadata_reader(
14041404 doc = Doc (docname = "foo" , citation = "Foo et al, 2002" , dockey = "1" ),
14051405 include_metadata = True ,
14061406 )
1407- assert metadata .summary
1408- assert "txt" in metadata .summary
1407+ assert metadata .name
1408+ assert "txt" in metadata .name
14091409 assert isinstance (metadata .chunk_metadata , ChunkMetadata )
1410- assert metadata .chunk_metadata .summary
1411- assert "overlap-code" in metadata .chunk_metadata .summary
1410+ assert metadata .chunk_metadata .name
1411+ assert "overlap-code" in metadata .chunk_metadata .name
14121412 assert metadata .chunk_metadata .overlap == 100
14131413 assert metadata .chunk_metadata .size == 3000
14141414 assert all (
@@ -1483,8 +1483,8 @@ async def test_read_doc_images_metadata(stub_data_dir: Path) -> None:
14831483 image_id = parsed_image .to_id ()
14841484 assert image_id .version == 4 , "Expected a uuid4-compatible ID"
14851485 assert image_id == UUID ("f6426bc3-382a-45a4-8677-08744044864f" )
1486- assert parsed_text .metadata .summary
1487- assert "image" in parsed_text .metadata .summary
1486+ assert parsed_text .metadata .name
1487+ assert "image" in parsed_text .metadata .name
14881488 assert parsed_text .metadata .count_parsed_media == 1
14891489 assert parsed_text .metadata .total_parsed_text_length == 0
14901490 assert parsed_text .metadata .chunk_metadata is None
@@ -1502,15 +1502,15 @@ async def test_read_doc_images_metadata(stub_data_dir: Path) -> None:
15021502 texts , metadata = texts_with_metadata
15031503 assert len (texts ) == 1
15041504 assert texts [0 ] == text
1505- assert metadata .summary
1506- assert "image" in metadata .summary
1505+ assert metadata .name
1506+ assert "image" in metadata .name
15071507 assert metadata .count_parsed_media == 1
15081508 assert metadata .total_parsed_text_length == 0
15091509 assert metadata .chunk_metadata is not None
15101510 assert not metadata .chunk_metadata .size
15111511 assert not metadata .chunk_metadata .overlap
1512- assert metadata .chunk_metadata .summary
1513- assert "algorithm=none" in metadata .chunk_metadata .summary
1512+ assert metadata .chunk_metadata .name
1513+ assert "algorithm=none" in metadata .chunk_metadata .name
15141514
15151515
15161516@pytest .mark .asyncio
0 commit comments