added extra time staps to chapter content
This commit is contained in:
@@ -19,7 +19,6 @@ from typing import Optional, Union, Dict, Any
|
|||||||
import os
|
import os
|
||||||
import requests
|
import requests
|
||||||
import os
|
import os
|
||||||
from PyPDF2 import PdfReader
|
|
||||||
from scripts.transcriber import transcribe_media,group_words_into_sentences # Import the transcribe_media function
|
from scripts.transcriber import transcribe_media,group_words_into_sentences # Import the transcribe_media function
|
||||||
from scripts.generate_summary import general_summary,custom_summary
|
from scripts.generate_summary import general_summary,custom_summary
|
||||||
# Load environment variables
|
# Load environment variables
|
||||||
@@ -170,4 +169,6 @@ async def startup_event():
|
|||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
import uvicorn
|
import uvicorn
|
||||||
uvicorn.run("app:app", host="0.0.0.0", port=3000, reload=True)
|
uvicorn.run("app:app", host="0.0.0.0", port=5056, reload=True)
|
||||||
|
|
||||||
|
|
||||||
+11
-3
@@ -25,7 +25,6 @@ At the end of each section, include a field named "minutes_total" which represen
|
|||||||
- The JSON output must be properly formatted and valid.
|
- The JSON output must be properly formatted and valid.
|
||||||
- Do not include any markdown or code block formatting markers (such as ```json) in your output.
|
- Do not include any markdown or code block formatting markers (such as ```json) in your output.
|
||||||
- Ensure that for each sentence you generate, every word in that sentence is assigned the same timestamp—the start timestamp of that sentence.
|
- Ensure that for each sentence you generate, every word in that sentence is assigned the same timestamp—the start timestamp of that sentence.
|
||||||
|
|
||||||
**Example Output JSON:**
|
**Example Output JSON:**
|
||||||
|
|
||||||
{
|
{
|
||||||
@@ -38,6 +37,11 @@ At the end of each section, include a field named "minutes_total" which represen
|
|||||||
{
|
{
|
||||||
"chapter": "Project Overview",
|
"chapter": "Project Overview",
|
||||||
"time_stamp": {"start": 5.12, "end": 5.68},
|
"time_stamp": {"start": 5.12, "end": 5.68},
|
||||||
|
"content": [
|
||||||
|
{"text":"- overview of the project's objectives.","original_transcript_start":3.4,"original_transcript_end":5.7},
|
||||||
|
{"text":"- It outlines the key milestones achieved so far.", "original_transcript_start":6.7, "original_transcript_end":10.5},
|
||||||
|
{"text":"- main challenges faced during the project.", "original_transcript_start":10.8, "original_transcript_end":11.2}
|
||||||
|
],
|
||||||
"words_time_stamp": [
|
"words_time_stamp": [
|
||||||
{"word": "Project", "timestamp": 5.12},
|
{"word": "Project", "timestamp": 5.12},
|
||||||
{"word": "Overview", "timestamp": 5.12}
|
{"word": "Overview", "timestamp": 5.12}
|
||||||
@@ -46,13 +50,17 @@ At the end of each section, include a field named "minutes_total" which represen
|
|||||||
{
|
{
|
||||||
"chapter": "Budget Review",
|
"chapter": "Budget Review",
|
||||||
"time_stamp": {"start": 10.50, "end": 11.20},
|
"time_stamp": {"start": 10.50, "end": 11.20},
|
||||||
|
"content": [
|
||||||
|
{"text":"- review of the current budget allocations.","original_transcript_start":10.5,"original_transcript_end":11.0},
|
||||||
|
{"text":"- discussion on potential cost-saving measures.", "original_transcript_start":11.1, "original_transcript_end":12.0},
|
||||||
|
{"text":"- approval of the budget for the next quarter.", "original_transcript_start":12.1, "original_transcript_end":13.0}
|
||||||
|
],
|
||||||
"words_time_stamp": [
|
"words_time_stamp": [
|
||||||
{"word": "Budget", "timestamp": 10.50},
|
{"word": "Budget", "timestamp": 10.50},
|
||||||
{"word": "Review", "timestamp": 10.50}
|
{"word": "Review", "timestamp": 10.50}
|
||||||
]
|
]
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
},
|
|
||||||
"Outcomes": {
|
"Outcomes": {
|
||||||
"minutes_total": 3,
|
"minutes_total": 3,
|
||||||
"content": [
|
"content": [
|
||||||
@@ -94,7 +102,7 @@ At the end of each section, include a field named "minutes_total" which represen
|
|||||||
]
|
]
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
NOTE: The content under each chapter provides a detailed bulleted explanation of the chapter. It includes "original_transcript_start" and "original_transcript_end," which indicate the timestamps for each bulleted point, referencing where to find it in the original transcript.
|
||||||
Remember, every word in each sentence must have a single timestamp equal to the start timestamp of that sentence. Your output must strictly adhere to the provided structure, and the "minutes_total" for each section must be correctly calculated based on the start time of the first sentence and the end time of the last sentence, expressed as a decimal if necessary.
|
Remember, every word in each sentence must have a single timestamp equal to the start timestamp of that sentence. Your output must strictly adhere to the provided structure, and the "minutes_total" for each section must be correctly calculated based on the start time of the first sentence and the end time of the last sentence, expressed as a decimal if necessary.
|
||||||
NOTE : start and end time are in seconds , so take that into considerations when calculating the total time in mins
|
NOTE : start and end time are in seconds , so take that into considerations when calculating the total time in mins
|
||||||
"""
|
"""
|
||||||
|
|||||||
Reference in New Issue
Block a user