@@ -21,7 +21,7 @@ def test_process_html_nonexistent_folder(self):
2121 assert result == []
2222
2323 @patch ("src.tools.process_html.glob.glob" )
24- @patch ("src.tools.process_html.UnstructuredHTMLLoader " )
24+ @patch ("src.tools.process_html.BSHTMLLoader " )
2525 @patch (
2626 "builtins.open" ,
2727 new_callable = mock_open ,
@@ -52,7 +52,7 @@ def test_process_html_without_splitting(
5252 assert result [0 ].metadata ["source" ] == "test.html"
5353
5454 @patch ("src.tools.process_html.glob.glob" )
55- @patch ("src.tools.process_html.UnstructuredHTMLLoader " )
55+ @patch ("src.tools.process_html.BSHTMLLoader " )
5656 @patch (
5757 "builtins.open" ,
5858 new_callable = mock_open ,
@@ -95,7 +95,7 @@ def test_process_html_with_splitting(
9595 mock_chunk .assert_called_once_with (500 , [mock_doc ])
9696
9797 @patch ("src.tools.process_html.glob.glob" )
98- @patch ("src.tools.process_html.UnstructuredHTMLLoader " )
98+ @patch ("src.tools.process_html.BSHTMLLoader " )
9999 @patch ("builtins.open" , new_callable = mock_open , read_data = "{}" )
100100 @patch ("src.tools.process_html.os.path.exists" )
101101 @patch ("src.tools.process_html.os.listdir" )
@@ -133,7 +133,7 @@ def test_process_html_split_without_chunk_size_raises_error(self):
133133 mock_open (read_data = '{"test.html": "https://example.com"}' ),
134134 ):
135135 with patch (
136- "src.tools.process_html.UnstructuredHTMLLoader "
136+ "src.tools.process_html.BSHTMLLoader "
137137 ) as mock_loader :
138138 mock_doc = Mock ()
139139 mock_doc .metadata = {"source" : "test.html" }
@@ -145,7 +145,7 @@ def test_process_html_split_without_chunk_size_raises_error(self):
145145 process_html (temp_dir , split_text = True , chunk_size = None )
146146
147147 @patch ("src.tools.process_html.glob.glob" )
148- @patch ("src.tools.process_html.UnstructuredHTMLLoader " )
148+ @patch ("src.tools.process_html.BSHTMLLoader " )
149149 @patch (
150150 "builtins.open" ,
151151 new_callable = mock_open ,
@@ -198,7 +198,7 @@ def test_process_html_logs_error_for_empty_folder(self, mock_logging):
198198
199199 @patch ("src.tools.process_html.logging" )
200200 @patch ("src.tools.process_html.glob.glob" )
201- @patch ("src.tools.process_html.UnstructuredHTMLLoader " )
201+ @patch ("src.tools.process_html.BSHTMLLoader " )
202202 @patch ("builtins.open" , new_callable = mock_open , read_data = "{}" )
203203 @patch ("src.tools.process_html.os.path.exists" )
204204 @patch ("src.tools.process_html.os.listdir" )
@@ -225,7 +225,7 @@ def test_process_html_logs_warning_for_missing_source(
225225 def test_process_html_metadata_transformation (self ):
226226 """Test that metadata is properly transformed."""
227227 with patch ("src.tools.process_html.glob.glob" ) as mock_glob :
228- with patch ("src.tools.process_html.UnstructuredHTMLLoader " ) as mock_loader :
228+ with patch ("src.tools.process_html.BSHTMLLoader " ) as mock_loader :
229229 with patch (
230230 "builtins.open" ,
231231 mock_open (read_data = '{"test.html": "https://example.com"}' ),
@@ -281,7 +281,7 @@ def test_process_html_real_file_structure(self):
281281 mock_open (read_data = '{"docs/html/test.html": "https://example.com"}' ),
282282 ):
283283 with patch (
284- "src.tools.process_html.UnstructuredHTMLLoader "
284+ "src.tools.process_html.BSHTMLLoader "
285285 ) as mock_loader :
286286 mock_doc = Mock ()
287287 mock_doc .metadata = {"source" : "test.html" }
0 commit comments