@@ -99,9 +99,12 @@ async def ingest_media_record_task():
9999 self .segment_database .delete_document_segments_by_media_record_id ([media_record_id ])
100100 self .segment_database .delete_video_segments_by_media_record_id ([media_record_id ])
101101
102+ _logger .info ("Processing file of Type: " + record_type )
102103 if record_type == "PRESENTATION" or record_type == "DOCUMENT" :
104+ _logger .info ("Starting document processor for " + str (media_record_id ))
103105 document_processor = DocumentProcessor ()
104106 document_data = document_processor .process (download_url )
107+ _logger .info ("Generating embeddings for " + str (media_record_id ))
105108 self .__lecture_pdf_embedding_generator .generate_embeddings (document_data .pages )
106109 for segment in document_data .pages :
107110 thumbnail_bytes = io .BytesIO ()
@@ -116,10 +119,12 @@ async def ingest_media_record_task():
116119
117120 if config .current ["lecture_llm_generator" ]["document_summary_generator" ]["enabled" ]:
118121 # generate and store a summary of this media record
122+ _logger .info ("Generating summary for " + str (media_record_id ))
119123 self .__lecture_llm_generator .generate_summary_for_document (document_data )
120124
121125 self .media_record_info_database .upsert_media_record_info (media_record_id , document_data .summary , None )
122126 elif record_type == "VIDEO" :
127+ _logger .info ("Starting video processor for " + str (media_record_id ))
123128 video_processor = VideoProcessor (
124129 segment_image_similarity_threshold =
125130 config .current ["video_segmentation" ]["segment_image_similarity_threshold" ],
@@ -128,13 +133,16 @@ async def ingest_media_record_task():
128133 del video_processor
129134
130135 # generate text embeddings for the segments of the video
136+ _logger .info ("Generating embeddings for " + str (media_record_id ))
131137 self .__lecture_video_embedding_generator .generate_embeddings (video_data .segments )
132138
133139 # generate titles for the video's segments if llm features enabled
134140 if config .current ["lecture_llm_generator" ]["segment_title_generator" ]["enabled" ]:
141+ _logger .info ("Generating title for " + str (media_record_id ))
135142 self .__lecture_llm_generator .generate_titles_for_video (video_data )
136143 else :
137144 # otherwise set empty data/placeholders
145+ _logger .info ("LLM generator disabled. Setting placeholders." )
138146 video_data .summary = []
139147 for i , segment in enumerate (video_data .segments , start = 1 ):
140148 segment .title = "Section " + str (i )
@@ -177,6 +185,9 @@ async def ingest_media_record_task():
177185 priority ))
178186
179187 def __generate_tags (self ):
188+ """
189+ Generates the suggested tags for all media records and assessments. This will recreate all suggested tags.
190+ """
180191 segments = self .segment_database .get_all_entity_segments ()
181192
182193 topic_model = TopicModel (segments )
@@ -188,6 +199,10 @@ def __generate_tags(self):
188199 self .__generate_tags_for_assessments (segments , topic_model )
189200
190201 def __generate_tags_for_media_records (self , segments , topic_model ):
202+ """
203+ Generates the suggested tags for all media records. This will recreate all suggested tags.
204+ This step will be skipped if no media records are found.
205+ """
191206 _logger .info ("Generating tags for media records." )
192207 media_records = self .media_record_info_database .get_all_media_records ()
193208 if not media_records : # check if media_records is empty
@@ -201,6 +216,10 @@ def __generate_tags_for_media_records(self, segments, topic_model):
201216 _logger .info ("Generated tags for media records." )
202217
203218 def __generate_tags_for_assessments (self , segments , topic_model ):
219+ """
220+ Generates the suggested tags for all assessments. This will recreate all suggested tags.
221+ This step will be skipped if no assessments are found.
222+ """
204223 _logger .info ("Generating tags for assesments." )
205224 assesments = self .assesment_database .get_all_assessments ()
206225 if not assesments : # check if assessments is empty
0 commit comments