From 6b85b6cfefc439d9a421fe463cf65fad6d9a50bd Mon Sep 17 00:00:00 2001 From: Hackett Lai Date: Fri, 30 Aug 2024 15:30:36 +0800 Subject: [PATCH] v2.1.0 --- .DS_Store | Bin 6148 -> 6148 bytes README.md | 17 ++-- function.js | 238 ++++++++++++++++++++++++++++++++++------------------ index.html | 206 ++++++++++++++++++++++++++------------------- style.css | 205 ++++++++++++++++++++++++++++++-------------- 5 files changed, 431 insertions(+), 235 deletions(-) diff --git a/.DS_Store b/.DS_Store index f3aa7cedcac7c50092b60da4cf93b0a4c11ead77..f08e9e0dc317a09950146dc305b4110a377f9af6 100644 GIT binary patch delta 26 ecmZoMXffE}#mLf79ce$=k5K{4*j&UoNelpUIS66^ delta 26 ecmZoMXffE}#mK_&L&t8iAEN@8vAKwGk{AGO&IkYi diff --git a/README.md b/README.md index a49dad4..59885ad 100644 --- a/README.md +++ b/README.md @@ -1,16 +1,21 @@ # srt-to-word -Welcome to the SRT to DOCX Converter page, a user-friendly tool designed to transform your subtitle files into easily shareable Word documents. This versatile application allows you to upload SRT files, view the converted text directly within the webpage, and download a well-formatted DOCX file at your convenience. +Welcome to the SRT to DOCX Converter, your easy-to-use tool for transforming subtitle files. Just upload your .srt files, Select the desired conversion option, and once you're happy, save it as a handy .docx Word document. Simplifying subtitles has never been easier! -## Example Site +#### Example Site https://srt.hackettlai.com - +*** ## Features - **Simple File Upload:** Easily upload your `.srt` subtitle files using the integrated file input option. -- **Instant Text Display:** Once converted, your subtitle text is displayed instantly on the page, formatted for easy viewing and ready for review. - **Auto Deduction:** Automatically removes line numbers and timestamp lines from the SRT file. -- **Dialogues Summary:** Added a summary of the dialogue count. -- **Readability Enhancements:** The converted text maintains the original line breaks and section spacing, making it easier to navigate your subtitles. +- **Conversion Options:** There are three conversion options available. + - **Original Breaks:** Preserves original line breaks only. + - **Break on Punct:** Break on Punct: Strips out original line breaks and add line breaks after punctuation marks for each dialogue. + - **In Paragraphs:** Merges all dialogue and group them into paragraphs by adding line breaks after punctuation marks. +- **Scroll to First Line:** Automatically scroll to the first line of the converted text after each conversion. +- **Dialogues Summary:** Added a summary of the dialogue count at the beginning. +- **Punctuation Breaks:** Uses a regular expression `/("|\.{3}|\.|!|\?)[^\S\r\n]|(……|⋯⋯|。|!|?)(?![\n”"」』…⋯。!?]|$)/g` to add line breaks after punctuation marks automatically. + > Note: Punctuation Breaks only work for Break on Punct, In Paragraphs only. - **Save as Word Document:** Able to download the converted document in the `.docx` format for easy sharing and editing. diff --git a/function.js b/function.js index b19d3ef..4dfe78b 100644 --- a/function.js +++ b/function.js @@ -1,176 +1,250 @@ let docBlob; // Variable to store the docx blob -const btn_convert = document.getElementById("btn_convert"); -const btn_download = document.getElementById("btn_download"); -const fileInput = document.getElementById("srtFile"); - +const btn_convert_1 = document.getElementById('btn_convert_1'); +const btn_convert_2 = document.getElementById('btn_convert_2'); +const btn_convert_3 = document.getElementById('btn_convert_3'); +const btn_download = document.getElementById('btn_download'); +const fileInput = document.getElementById('srtFile'); +const result_div = document.getElementById('result_div'); // copyrightYear function to set the current year in the #thisYear element -window.addEventListener("load", copyright, true); +window.addEventListener('load', copyright, true); function copyright() { const thisYear = new Date().getFullYear(); - document.getElementById("thisYear").innerHTML = thisYear; + document.getElementById('thisYear').innerHTML = thisYear; } - // Enable the convert button once a file is selected -fileInput.addEventListener("change", function () { +fileInput.addEventListener('change', function () { if (fileInput.files.length > 0) { - btn_convert.disabled = false; - const resultDiv = document.getElementById("result_div"); - resultDiv.innerHTML = ""; // Clear any previous content + btn_convert_1.disabled = false; + btn_convert_2.disabled = false; + btn_convert_3.disabled = false; + const resultDiv = document.getElementById('result_div'); + resultDiv.innerHTML = ''; // Clear any previous content } else { - btn_convert.disabled = true; + btn_convert_1.disabled = true; + btn_convert_2.disabled = true; + btn_convert_3.disabled = true; } }); - // Start conversion process when the button is clicked -btn_convert.addEventListener("click", convertSrtToDocx); - +btn_convert_1.addEventListener('click', () => { + convertSrtToDocx(1); +}); +btn_convert_2.addEventListener('click', () => { + convertSrtToDocx(2); +}); +btn_convert_3.addEventListener('click', () => { + convertSrtToDocx(3); +}); // Converts an uploaded SRT file to DOCX format -function convertSrtToDocx() { +function convertSrtToDocx(convertMode) { + result_div.classList.add('glow'); // Add glow effect to the result div + setTimeout(() => { + result_div.classList.remove('glow'); + }, 400); const file = fileInput.files[0]; if (!file) { - alert("Please upload a .srt file first."); + alert('Please upload a .srt file first.'); return; } - const reader = new FileReader(); reader.onload = function (event) { const srtText = event.target.result; - const result = parseSrt(srtText); + let result; + if (convertMode === 1) { + result = parseSrtM1(srtText); + btn_convert_1.disabled = true; + btn_convert_2.disabled = false; + btn_convert_3.disabled = false; + } else if (convertMode === 2) { + result = parseSrtM2(srtText); + btn_convert_1.disabled = false; + btn_convert_2.disabled = true; + btn_convert_3.disabled = false; + } else if (convertMode === 3) { + result = parseSrtM3(srtText); + btn_convert_1.disabled = false; + btn_convert_2.disabled = false; + btn_convert_3.disabled = true; + } displayResult(result); + // Scroll to the first

inside result_div + const firstParagraph = result_div.querySelector('p'); + if (firstParagraph) { + firstParagraph.scrollIntoView({ behavior: 'smooth' }); + } }; reader.readAsText(file); - - btn_convert.disabled = true; btn_download.disabled = false; } - // Parses the SRT text into an array of sentences and counts the dialogues -function parseSrt(srtContent) { +// Mode 1: Preserves original line breaks only +function parseSrtM1(srtContent) { + // Split the SRT content by lines + const lines = srtContent.split('\n'); + // Initialize an empty array to store the trimmed dialogue + const trimmedDialogue = []; + // Initialize a variable to hold the current dialogue + let currentDialogue = []; + for (let i = 0; i < lines.length; i++) { + const line = lines[i].trim(); + // Skip the line number and timestamp lines + if (line === '' || /^\d+$/.test(line) || /^(\d{2}):(\d{2}):(\d{2}),(\d{3}) --> (\d{2}):(\d{2}):(\d{2}),(\d{3})$/.test(line)) { + // If we have accumulated dialogue, push it to the trimmedDialogue array + if (currentDialogue.length > 0) { + trimmedDialogue.push(currentDialogue.join('\n')); + currentDialogue = []; // Reset currentDialogue for the next dialogue + } + continue; // Skip to the next iteration + } + // If the line is part of the dialogue, add it to the currentDialogue + currentDialogue.push(line); + } + // After the loop, check if there's any remaining dialogue to push + if (currentDialogue.length > 0) { + trimmedDialogue.push(currentDialogue.join('\n')); + } + // Join all dialogues with an empty line between each + const parsedSentences = trimmedDialogue.join('\n\n\n'); + const dialogueCount = trimmedDialogue.length; + return { parsedSentences, dialogueCount }; +} +// Mode 2: Strips out original line breaks and add line breaks after punctuation marks for each dialogue +function parseSrtM2(srtContent) { // Split the SRT content by lines - const lines = srtContent.split("\n"); - + const lines = srtContent.split('\n'); // Initialize an empty array to store the trimmed dialogue const trimmedDialogue = []; - // Initialize a variable to hold the current dialogue let currentDialogue = []; - for (let i = 0; i < lines.length; i++) { const line = lines[i].trim(); - // Skip the line number and timestamp lines - if ( - line === "" || - /^\d+$/.test(line) || - /^(\d{2}):(\d{2}):(\d{2}),(\d{3}) --> (\d{2}):(\d{2}):(\d{2}),(\d{3})$/.test( - line - ) - ) { + if (line === '' || /^\d+$/.test(line) || /^(\d{2}):(\d{2}):(\d{2}),(\d{3}) --> (\d{2}):(\d{2}):(\d{2}),(\d{3})$/.test(line)) { // If we have accumulated dialogue, push it to the trimmedDialogue array if (currentDialogue.length > 0) { - trimmedDialogue.push(currentDialogue.join("\n")); + let joinedDialogue = currentDialogue.join(' '); // Join with a space + joinedDialogue = joinedDialogue.replace(/("|\.{3}|\.|!|\?)[^\S\r\n]|(……|⋯⋯|。|!|?)(?![\n”"」』…⋯。!?]|$)/g, '$1$2\n'); // Add line breaks + trimmedDialogue.push(joinedDialogue); currentDialogue = []; // Reset currentDialogue for the next dialogue } continue; // Skip to the next iteration } - // If the line is part of the dialogue, add it to the currentDialogue currentDialogue.push(line); } - // After the loop, check if there's any remaining dialogue to push if (currentDialogue.length > 0) { - trimmedDialogue.push(currentDialogue.join("\n")); + let joinedDialogue = currentDialogue.join(' '); // Join with a space + joinedDialogue = joinedDialogue.replace(/("|\.{3}|\.|!|\?)[^\S\r\n]|(……|⋯⋯|。|!|?)(?![\n”"」』…⋯。!?]|$)/g, '$1$2\n'); // Add line breaks + trimmedDialogue.push(joinedDialogue); } - // Join all dialogues with an empty line between each - const parsedSentences = trimmedDialogue.join("\n\n\n"); + const parsedSentences = trimmedDialogue.join('\n\n\n'); + const dialogueCount = trimmedDialogue.length; + return { parsedSentences, dialogueCount }; +} +// Mode 3: Merges all dialogue and group them into paragraphs by adding line breaks after punctuation marks +function parseSrtM3(srtContent) { + // Split the SRT content by lines + const lines = srtContent.split('\n'); + // Initialize an empty array to store the trimmed dialogue + const trimmedDialogue = []; + // Initialize a variable to hold the current dialogue + let currentDialogue = []; + for (let i = 0; i < lines.length; i++) { + const line = lines[i].trim(); + // Skip the line number and timestamp lines + if (line === '' || /^\d+$/.test(line) || /^(\d{2}):(\d{2}):(\d{2}),(\d{3}) --> (\d{2}):(\d{2}):(\d{2}),(\d{3})$/.test(line)) { + // If we have accumulated dialogue, push it to the trimmedDialogue array + if (currentDialogue.length > 0) { + trimmedDialogue.push(currentDialogue.join(' ')); + currentDialogue = []; // Reset currentDialogue for the next dialogue + } + continue; // Skip to the next iteration + } + // If the line is part of the dialogue, add it to the currentDialogue + currentDialogue.push(line); + } + // After the loop, check if there's any remaining dialogue to push + if (currentDialogue.length > 0) { + trimmedDialogue.push(currentDialogue.join(' ')); + } + // Join all dialogues with space between each + let parsedSentences = trimmedDialogue.join(' '); + // Use the regular expression to insert line breaks + parsedSentences = parsedSentences.replace(/("|\.{3}|\.|!|\?)[^\S\r\n]|(……|⋯⋯|。|!|?)(?![\n”"」』…⋯。!?]|$)/g, '$1$2\n\n\n'); const dialogueCount = trimmedDialogue.length; - return { parsedSentences, dialogueCount }; } - // Displays the parsed sentences in the result div function displayResult(result) { - const resultDiv = document.getElementById("result_div"); - resultDiv.innerHTML = ""; // Clear previous results - + const resultDiv = document.getElementById('result_div'); + resultDiv.innerHTML = ''; // Clear previous results // Display the count of dialogues - const countParagraph = document.createElement("p"); - countParagraph.textContent = `*** Total Dialogues: ${result.dialogueCount} ***`; + const countParagraph = document.createElement('p'); + countParagraph.textContent = `*** Original Dialogues: ${result.dialogueCount} ***`; resultDiv.appendChild(countParagraph); - // Add a space line - const spaceLine = document.createElement("p"); - spaceLine.innerHTML = "
"; + const spaceLine = document.createElement('p'); + spaceLine.innerHTML = '
'; resultDiv.appendChild(spaceLine); - // Ensure parsedSentences is a string - if (typeof result.parsedSentences === "string") { - result.parsedSentences.split("\n\n").forEach((sentence) => { - const p = document.createElement("p"); + if (typeof result.parsedSentences === 'string') { + result.parsedSentences.split('\n\n').forEach((sentence) => { + const p = document.createElement('p'); // Replace newline characters with
tags - p.innerHTML = sentence.replace(/\n/g, "
"); + p.innerHTML = sentence.replace(/\n/g, '
'); // If the sentence is empty, add a
tag - if (sentence === "") { - p.innerHTML = "
"; + if (sentence === '') { + p.innerHTML = '
'; } resultDiv.appendChild(p); }); } else { - console.error("Expected a string but got:", result.parsedSentences); + console.error('Expected a string but got:', result.parsedSentences); } - generateDocxFile(); // Prepare the docx file for download } - - // Generates a DOCX file from the parsed sentences function generateDocxFile() { - const resultDiv = document.getElementById("result_div"); - const paragraphs = resultDiv.querySelectorAll("p"); - + const resultDiv = document.getElementById('result_div'); + const paragraphs = resultDiv.querySelectorAll('p'); // Split each paragraph by
and create separate Paragraph objects const children = Array.from(paragraphs).flatMap((p) => { - return p.innerHTML - .split(//gi) - .map((line) => new docx.Paragraph(line.trim())); + return p.innerHTML.split(//gi).map((line) => new docx.Paragraph(line.trim())); }); - const doc = new docx.Document({ - creator: "SRT to DOCX Converter", - title: "Subtitle Document", + creator: 'SRT to DOCX Converter', + title: 'Subtitle Document', sections: [ { children: children, }, ], }); - docx.Packer.toBlob(doc).then((blob) => { docBlob = blob; // Store the blob for later download }); } - // Downloads the generated DOCX file function downloadDocx() { if (!docBlob) { - alert("Please convert a file before downloading."); + alert('Please convert a file before downloading.'); return; } - - const fileName = fileInput.files[0].name.replace(".srt", ""); + const fileName = fileInput.files[0].name.replace('.srt', ''); const url = URL.createObjectURL(docBlob); - const link = document.createElement("a"); + const link = document.createElement('a'); link.href = url; link.download = `${fileName}.docx`; link.click(); - // Reset after download - fileInput.value = ""; - const resultDiv = document.getElementById("result_div"); - resultDiv.innerHTML = ""; - btn_convert.disabled = true; + fileInput.value = ''; + const resultDiv = document.getElementById('result_div'); + resultDiv.innerHTML = ''; + btn_convert_1.disabled = true; + btn_convert_2.disabled = true; + btn_convert_3.disabled = true; btn_download.disabled = true; docBlob = null; } diff --git a/index.html b/index.html index 752c622..ee7c989 100644 --- a/index.html +++ b/index.html @@ -1,88 +1,126 @@ - - - - SRT Extractor - - - - - - - - - - - - - - - - - - - - - - - - -

SRT to DOCX Converter

-

Welcome to the SRT to DOCX Converter, your easy-to-use tool for transforming subtitle files. Just upload your .srt files, we'll strip out the timestamps for you and give you a neat summary of the dialogues, all while keeping the original line breaks and punctuation intact. Once you're happy, save everything as a handy .docx Word document. Simplifying subtitles has never been easier!

-
- - -
-
- - - -