UNPKG

9.07 kBSource Map (JSON)View Raw
1{"version":3,"sources":["webpack:///webpack/bootstrap","webpack:///./packages/stt-adapters/digital-paper-edit/group-words-by-speakers.js"],"names":["installedModules","__webpack_require__","moduleId","exports","module","i","l","modules","call","m","c","d","name","getter","o","Object","defineProperty","enumerable","get","r","Symbol","toStringTag","value","t","mode","__esModule","ns","create","key","bind","n","object","property","prototype","hasOwnProperty","p","s","groupWordsInParagraphsBySpeakers","words","segments","results","currentSegment","currentSegmentIndex","previousSegmentIndex","paragraph","text","speaker","forEach","word","find","seg","start","end","findSegmentForWord","indexOf","push","trim","addWordsToSpeakersParagraphs"],"mappings":"2BACE,IAAIA,EAAmB,GAGvB,SAASC,EAAoBC,GAG5B,GAAGF,EAAiBE,GACnB,OAAOF,EAAiBE,GAAUC,QAGnC,IAAIC,EAASJ,EAAiBE,GAAY,CACzCG,EAAGH,EACHI,GAAG,EACHH,QAAS,IAUV,OANAI,EAAQL,GAAUM,KAAKJ,EAAOD,QAASC,EAAQA,EAAOD,QAASF,GAG/DG,EAAOE,GAAI,EAGJF,EAAOD,QA0Df,OArDAF,EAAoBQ,EAAIF,EAGxBN,EAAoBS,EAAIV,EAGxBC,EAAoBU,EAAI,SAASR,EAASS,EAAMC,GAC3CZ,EAAoBa,EAAEX,EAASS,IAClCG,OAAOC,eAAeb,EAASS,EAAM,CAAEK,YAAY,EAAMC,IAAKL,KAKhEZ,EAAoBkB,EAAI,SAAShB,GACX,oBAAXiB,QAA0BA,OAAOC,aAC1CN,OAAOC,eAAeb,EAASiB,OAAOC,YAAa,CAAEC,MAAO,WAE7DP,OAAOC,eAAeb,EAAS,aAAc,CAAEmB,OAAO,KAQvDrB,EAAoBsB,EAAI,SAASD,EAAOE,GAEvC,GADU,EAAPA,IAAUF,EAAQrB,EAAoBqB,IAC/B,EAAPE,EAAU,OAAOF,EACpB,GAAW,EAAPE,GAA8B,iBAAVF,GAAsBA,GAASA,EAAMG,WAAY,OAAOH,EAChF,IAAII,EAAKX,OAAOY,OAAO,MAGvB,GAFA1B,EAAoBkB,EAAEO,GACtBX,OAAOC,eAAeU,EAAI,UAAW,CAAET,YAAY,EAAMK,MAAOA,IACtD,EAAPE,GAA4B,iBAATF,EAAmB,IAAI,IAAIM,KAAON,EAAOrB,EAAoBU,EAAEe,EAAIE,EAAK,SAASA,GAAO,OAAON,EAAMM,IAAQC,KAAK,KAAMD,IAC9I,OAAOF,GAIRzB,EAAoB6B,EAAI,SAAS1B,GAChC,IAAIS,EAAST,GAAUA,EAAOqB,WAC7B,WAAwB,OAAOrB,EAAgB,SAC/C,WAA8B,OAAOA,GAEtC,OADAH,EAAoBU,EAAEE,EAAQ,IAAKA,GAC5BA,GAIRZ,EAAoBa,EAAI,SAASiB,EAAQC,GAAY,OAAOjB,OAAOkB,UAAUC,eAAe1B,KAAKuB,EAAQC,IAGzG/B,EAAoBkC,EAAI,GAIjBlC,EAAoBA,EAAoBmC,EAAI,I,kCClFrD,OA4IeC,UA9Df,SAA0CC,EAAOC,GAG/C,OAGF,SAAuCD,EAAOC,GAAW,IACjDC,EAAU,GACZC,EAAiB,MACjBC,EAAsB,EACtBC,EAAuB,EACvBC,EAAY,CAAEN,MAAO,GAAIO,KAAM,GAAIC,QAAS,IAwBhD,OAvBAR,EAAMS,SAAQ,SAACC,IACbP,EAsCJ,SAA4BO,EAAMT,GAQhC,OANmBA,EAASU,MAAK,SAACC,GAChC,GAAKF,EAAKG,OAASD,EAAIC,OAAWH,EAAKI,KAAOF,EAAIE,IAChD,OAAOF,KA1CQG,CAAmBL,EAAMT,OAGxCG,EAAsBH,EAASe,QAAQb,MACXE,GAC1BC,EAAUN,MAAMiB,KAAKP,GACrBJ,EAAUC,MAAQG,EAAKH,KAAO,IAC9BD,EAAUE,QAAUL,EAAeK,UAGnCH,EAAuBD,EACvBE,EAAUC,KAAKW,OACfhB,EAAQe,KAAKX,IACbA,EAAY,CAAEN,MAAO,GAAIO,KAAM,GAAIC,QAAS,KAClCR,MAAMiB,KAAKP,GACrBJ,EAAUC,MAAQG,EAAKH,KAAO,IAC9BD,EAAUE,QAAUL,EAAeK,aAIzCN,EAAQe,KAAKX,GAENJ,EAlCQiB,CAA6BnB,EAAOC","file":"groupWordsInParagraphsBySpeakersDPE.js","sourcesContent":[" \t// The module cache\n \tvar installedModules = {};\n\n \t// The require function\n \tfunction __webpack_require__(moduleId) {\n\n \t\t// Check if module is in cache\n \t\tif(installedModules[moduleId]) {\n \t\t\treturn installedModules[moduleId].exports;\n \t\t}\n \t\t// Create a new module (and put it into the cache)\n \t\tvar module = installedModules[moduleId] = {\n \t\t\ti: moduleId,\n \t\t\tl: false,\n \t\t\texports: {}\n \t\t};\n\n \t\t// Execute the module function\n \t\tmodules[moduleId].call(module.exports, module, module.exports, __webpack_require__);\n\n \t\t// Flag the module as loaded\n \t\tmodule.l = true;\n\n \t\t// Return the exports of the module\n \t\treturn module.exports;\n \t}\n\n\n \t// expose the modules object (__webpack_modules__)\n \t__webpack_require__.m = modules;\n\n \t// expose the module cache\n \t__webpack_require__.c = installedModules;\n\n \t// define getter function for harmony exports\n \t__webpack_require__.d = function(exports, name, getter) {\n \t\tif(!__webpack_require__.o(exports, name)) {\n \t\t\tObject.defineProperty(exports, name, { enumerable: true, get: getter });\n \t\t}\n \t};\n\n \t// define __esModule on exports\n \t__webpack_require__.r = function(exports) {\n \t\tif(typeof Symbol !== 'undefined' && Symbol.toStringTag) {\n \t\t\tObject.defineProperty(exports, Symbol.toStringTag, { value: 'Module' });\n \t\t}\n \t\tObject.defineProperty(exports, '__esModule', { value: true });\n \t};\n\n \t// create a fake namespace object\n \t// mode & 1: value is a module id, require it\n \t// mode & 2: merge all properties of value into the ns\n \t// mode & 4: return value when already ns object\n \t// mode & 8|1: behave like require\n \t__webpack_require__.t = function(value, mode) {\n \t\tif(mode & 1) value = __webpack_require__(value);\n \t\tif(mode & 8) return value;\n \t\tif((mode & 4) && typeof value === 'object' && value && value.__esModule) return value;\n \t\tvar ns = Object.create(null);\n \t\t__webpack_require__.r(ns);\n \t\tObject.defineProperty(ns, 'default', { enumerable: true, value: value });\n \t\tif(mode & 2 && typeof value != 'string') for(var key in value) __webpack_require__.d(ns, key, function(key) { return value[key]; }.bind(null, key));\n \t\treturn ns;\n \t};\n\n \t// getDefaultExport function for compatibility with non-harmony modules\n \t__webpack_require__.n = function(module) {\n \t\tvar getter = module && module.__esModule ?\n \t\t\tfunction getDefault() { return module['default']; } :\n \t\t\tfunction getModuleExports() { return module; };\n \t\t__webpack_require__.d(getter, 'a', getter);\n \t\treturn getter;\n \t};\n\n \t// Object.prototype.hasOwnProperty.call\n \t__webpack_require__.o = function(object, property) { return Object.prototype.hasOwnProperty.call(object, property); };\n\n \t// __webpack_public_path__\n \t__webpack_require__.p = \"\";\n\n\n \t// Load entry module and return exports\n \treturn __webpack_require__(__webpack_require__.s = 48);\n","/**\n edge cases\n- more segments then words - not an issue if you start by matching words with segment\nand handle edge case where it doesn't find a match\n- more words then segments - orphan words?\n*\n* Takes in list of words and list of paragraphs (paragraphs have speakers info associated with it)\n```js\n{\n \"words\": [\n {\n \"id\": 0,\n \"start\": 13.02,\n \"end\": 13.17,\n \"text\": \"There\"\n },\n {\n \"id\": 1,\n \"start\": 13.17,\n \"end\": 13.38,\n \"text\": \"is\"\n },\n ...\n ],\n \"paragraphs\": [\n {\n \"id\": 0,\n \"start\": 13.02,\n \"end\": 13.86,\n \"speaker\": \"TBC 00\"\n },\n {\n \"id\": 1,\n \"start\": 13.86,\n \"end\": 19.58,\n \"speaker\": \"TBC 1\"\n },\n ...\n ]\n}\n```\n* and returns a list of words grouped into paragraphs, with words, text and speaker attribute\n```js\n[\n {\n \"words\": [\n {\n \"id\": 0,\n \"start\": 13.02,\n \"end\": 13.17,\n \"text\": \"There\"\n },\n {\n \"id\": 1,\n \"start\": 13.17,\n \"end\": 13.38,\n \"text\": \"is\"\n },\n {\n \"id\": 2,\n \"start\": 13.38,\n \"end\": 13.44,\n \"text\": \"a\"\n },\n {\n \"id\": 3,\n \"start\": 13.44,\n \"end\": 13.86,\n \"text\": \"day.\"\n }\n ],\n \"text\": \"There is a day.\",\n \"speaker\": \"TBC 00\"\n },\n ...\n]\n```\n */\nfunction groupWordsInParagraphsBySpeakers(words, segments) {\n const result = addWordsToSpeakersParagraphs(words, segments);\n\n return result;\n};\n\nfunction addWordsToSpeakersParagraphs (words, segments) {\n const results = [];\n let currentSegment = 'UKN';\n let currentSegmentIndex = 0;\n let previousSegmentIndex = 0;\n let paragraph = { words: [], text: '', speaker: '' };\n words.forEach((word) => {\n currentSegment = findSegmentForWord(word, segments);\n // if a segment exists for the word\n if (currentSegment) {\n currentSegmentIndex = segments.indexOf(currentSegment);\n if (currentSegmentIndex === previousSegmentIndex) {\n paragraph.words.push(word);\n paragraph.text += word.text + ' ';\n paragraph.speaker = currentSegment.speaker;\n }\n else {\n previousSegmentIndex = currentSegmentIndex;\n paragraph.text.trim();\n results.push(paragraph);\n paragraph = { words: [], text: '', speaker: '' };\n paragraph.words.push(word);\n paragraph.text += word.text + ' ';\n paragraph.speaker = currentSegment.speaker;\n }\n }\n });\n results.push(paragraph);\n\n return results;\n}\n\n/**\n* Helper functions\n*/\n\n/**\n* given word start and end time attributes\n* looks for segment range that contains that word\n* if it doesn't find any it returns a segment with `UKN`\n* speaker attributes.\n* @param {object} word - word object\n* @param {array} segments - list of segments objects\n* @return {object} - a single segment whose range contains the word\n*/\nfunction findSegmentForWord(word, segments) {\n\n const tmpSegment = segments.find((seg) => {\n if ((word.start >= seg.start) && (word.end <= seg.end)) {\n return seg;\n }\n });\n\n return tmpSegment;\n}\n\nexport default groupWordsInParagraphsBySpeakers;"],"sourceRoot":""}
\No newline at end of file