diff --git a/Dockerfile.cpu b/Dockerfile.cpu new file mode 100644 index 0000000000000000000000000000000000000000..dceffbfc595003c75680694d24e4de72536559c7 --- /dev/null +++ b/Dockerfile.cpu @@ -0,0 +1,35 @@ +FROM python:3.9 +# System dependency: ffmpeg. The apt package lists are removed in the same layer so they do not bloat the image. +RUN apt-get update && \ + apt-get install -y --no-install-recommends \ + ffmpeg && rm -rf /var/lib/apt/lists/* + +RUN python3 -m pip install --no-cache-dir --upgrade pip + +# Python installation +WORKDIR /usr/src/app + +# Force CPU versions of torch (pinned wheels; --no-cache-dir keeps pip's download cache out of the layer) +RUN pip3 install --no-cache-dir \ + torch==1.13.1+cpu \ + torchaudio==0.13.1+cpu \ + -f https://download.pytorch.org/whl/torch_stable.html + +# Note: Installing the Python requirements before copying the source lets Docker reuse this cached layer when re-building after a source change. +COPY requirements.txt /usr/src/app/requirements.txt +RUN cd /usr/src/app/ && pip3 install --no-cache-dir -r requirements.txt + +# Copy source +COPY setup.py /usr/src/app/setup.py +COPY whisper_timestamped /usr/src/app/whisper_timestamped + +# Install the package (non-editable) together with its "dev" extras +RUN cd /usr/src/app/ && pip3 install --no-cache-dir ".[dev]" + +# Cleanup: the package is installed, so the build inputs are no longer needed in the working directory +RUN rm -R /usr/src/app/requirements.txt /usr/src/app/setup.py /usr/src/app/whisper_timestamped + +# Copy tests +COPY tests /usr/src/app/tests + +ENTRYPOINT ["/bin/bash"] \ No newline at end of file diff --git a/LICENCE b/LICENCE new file mode 100644 index 0000000000000000000000000000000000000000..0ad25db4bd1d86c452db3f9602ccdbe172438f52 --- /dev/null +++ b/LICENCE @@ -0,0 +1,661 @@ + GNU AFFERO GENERAL PUBLIC LICENSE + Version 3, 19 November 2007 + + Copyright (C) 2007 Free Software Foundation, Inc. + Everyone is permitted to copy and distribute verbatim copies + of this license document, but changing it is not allowed. + + Preamble + + The GNU Affero General Public License is a free, copyleft license for +software and other kinds of works, specifically designed to ensure +cooperation with the community in the case of network server software. + + The licenses for most software and other practical works are designed +to take away your freedom to share and change the works. 
By contrast, +our General Public Licenses are intended to guarantee your freedom to +share and change all versions of a program--to make sure it remains free +software for all its users. + + When we speak of free software, we are referring to freedom, not +price. Our General Public Licenses are designed to make sure that you +have the freedom to distribute copies of free software (and charge for +them if you wish), that you receive source code or can get it if you +want it, that you can change the software or use pieces of it in new +free programs, and that you know you can do these things. + + Developers that use our General Public Licenses protect your rights +with two steps: (1) assert copyright on the software, and (2) offer +you this License which gives you legal permission to copy, distribute +and/or modify the software. + + A secondary benefit of defending all users' freedom is that +improvements made in alternate versions of the program, if they +receive widespread use, become available for other developers to +incorporate. Many developers of free software are heartened and +encouraged by the resulting cooperation. However, in the case of +software used on network servers, this result may fail to come about. +The GNU General Public License permits making a modified version and +letting the public access it on a server without ever releasing its +source code to the public. + + The GNU Affero General Public License is designed specifically to +ensure that, in such cases, the modified source code becomes available +to the community. It requires the operator of a network server to +provide the source code of the modified version running there to the +users of that server. Therefore, public use of a modified version, on +a publicly accessible server, gives the public access to the source +code of the modified version. + + An older license, called the Affero General Public License and +published by Affero, was designed to accomplish similar goals. 
This is +a different license, not a version of the Affero GPL, but Affero has +released a new version of the Affero GPL which permits relicensing under +this license. + + The precise terms and conditions for copying, distribution and +modification follow. + + TERMS AND CONDITIONS + + 0. Definitions. + + "This License" refers to version 3 of the GNU Affero General Public License. + + "Copyright" also means copyright-like laws that apply to other kinds of +works, such as semiconductor masks. + + "The Program" refers to any copyrightable work licensed under this +License. Each licensee is addressed as "you". "Licensees" and +"recipients" may be individuals or organizations. + + To "modify" a work means to copy from or adapt all or part of the work +in a fashion requiring copyright permission, other than the making of an +exact copy. The resulting work is called a "modified version" of the +earlier work or a work "based on" the earlier work. + + A "covered work" means either the unmodified Program or a work based +on the Program. + + To "propagate" a work means to do anything with it that, without +permission, would make you directly or secondarily liable for +infringement under applicable copyright law, except executing it on a +computer or modifying a private copy. Propagation includes copying, +distribution (with or without modification), making available to the +public, and in some countries other activities as well. + + To "convey" a work means any kind of propagation that enables other +parties to make or receive copies. Mere interaction with a user through +a computer network, with no transfer of a copy, is not conveying. 
+ + An interactive user interface displays "Appropriate Legal Notices" +to the extent that it includes a convenient and prominently visible +feature that (1) displays an appropriate copyright notice, and (2) +tells the user that there is no warranty for the work (except to the +extent that warranties are provided), that licensees may convey the +work under this License, and how to view a copy of this License. If +the interface presents a list of user commands or options, such as a +menu, a prominent item in the list meets this criterion. + + 1. Source Code. + + The "source code" for a work means the preferred form of the work +for making modifications to it. "Object code" means any non-source +form of a work. + + A "Standard Interface" means an interface that either is an official +standard defined by a recognized standards body, or, in the case of +interfaces specified for a particular programming language, one that +is widely used among developers working in that language. + + The "System Libraries" of an executable work include anything, other +than the work as a whole, that (a) is included in the normal form of +packaging a Major Component, but which is not part of that Major +Component, and (b) serves only to enable use of the work with that +Major Component, or to implement a Standard Interface for which an +implementation is available to the public in source code form. A +"Major Component", in this context, means a major essential component +(kernel, window system, and so on) of the specific operating system +(if any) on which the executable work runs, or a compiler used to +produce the work, or an object code interpreter used to run it. + + The "Corresponding Source" for a work in object code form means all +the source code needed to generate, install, and (for an executable +work) run the object code and to modify the work, including scripts to +control those activities. 
However, it does not include the work's +System Libraries, or general-purpose tools or generally available free +programs which are used unmodified in performing those activities but +which are not part of the work. For example, Corresponding Source +includes interface definition files associated with source files for +the work, and the source code for shared libraries and dynamically +linked subprograms that the work is specifically designed to require, +such as by intimate data communication or control flow between those +subprograms and other parts of the work. + + The Corresponding Source need not include anything that users +can regenerate automatically from other parts of the Corresponding +Source. + + The Corresponding Source for a work in source code form is that +same work. + + 2. Basic Permissions. + + All rights granted under this License are granted for the term of +copyright on the Program, and are irrevocable provided the stated +conditions are met. This License explicitly affirms your unlimited +permission to run the unmodified Program. The output from running a +covered work is covered by this License only if the output, given its +content, constitutes a covered work. This License acknowledges your +rights of fair use or other equivalent, as provided by copyright law. + + You may make, run and propagate covered works that you do not +convey, without conditions so long as your license otherwise remains +in force. You may convey covered works to others for the sole purpose +of having them make modifications exclusively for you, or provide you +with facilities for running those works, provided that you comply with +the terms of this License in conveying all material for which you do +not control copyright. Those thus making or running the covered works +for you must do so exclusively on your behalf, under your direction +and control, on terms that prohibit them from making any copies of +your copyrighted material outside their relationship with you. 
+ + Conveying under any other circumstances is permitted solely under +the conditions stated below. Sublicensing is not allowed; section 10 +makes it unnecessary. + + 3. Protecting Users' Legal Rights From Anti-Circumvention Law. + + No covered work shall be deemed part of an effective technological +measure under any applicable law fulfilling obligations under article +11 of the WIPO copyright treaty adopted on 20 December 1996, or +similar laws prohibiting or restricting circumvention of such +measures. + + When you convey a covered work, you waive any legal power to forbid +circumvention of technological measures to the extent such circumvention +is effected by exercising rights under this License with respect to +the covered work, and you disclaim any intention to limit operation or +modification of the work as a means of enforcing, against the work's +users, your or third parties' legal rights to forbid circumvention of +technological measures. + + 4. Conveying Verbatim Copies. + + You may convey verbatim copies of the Program's source code as you +receive it, in any medium, provided that you conspicuously and +appropriately publish on each copy an appropriate copyright notice; +keep intact all notices stating that this License and any +non-permissive terms added in accord with section 7 apply to the code; +keep intact all notices of the absence of any warranty; and give all +recipients a copy of this License along with the Program. + + You may charge any price or no price for each copy that you convey, +and you may offer support or warranty protection for a fee. + + 5. Conveying Modified Source Versions. + + You may convey a work based on the Program, or the modifications to +produce it from the Program, in the form of source code under the +terms of section 4, provided that you also meet all of these conditions: + + a) The work must carry prominent notices stating that you modified + it, and giving a relevant date. 
+ + b) The work must carry prominent notices stating that it is + released under this License and any conditions added under section + 7. This requirement modifies the requirement in section 4 to + "keep intact all notices". + + c) You must license the entire work, as a whole, under this + License to anyone who comes into possession of a copy. This + License will therefore apply, along with any applicable section 7 + additional terms, to the whole of the work, and all its parts, + regardless of how they are packaged. This License gives no + permission to license the work in any other way, but it does not + invalidate such permission if you have separately received it. + + d) If the work has interactive user interfaces, each must display + Appropriate Legal Notices; however, if the Program has interactive + interfaces that do not display Appropriate Legal Notices, your + work need not make them do so. + + A compilation of a covered work with other separate and independent +works, which are not by their nature extensions of the covered work, +and which are not combined with it such as to form a larger program, +in or on a volume of a storage or distribution medium, is called an +"aggregate" if the compilation and its resulting copyright are not +used to limit the access or legal rights of the compilation's users +beyond what the individual works permit. Inclusion of a covered work +in an aggregate does not cause this License to apply to the other +parts of the aggregate. + + 6. Conveying Non-Source Forms. + + You may convey a covered work in object code form under the terms +of sections 4 and 5, provided that you also convey the +machine-readable Corresponding Source under the terms of this License, +in one of these ways: + + a) Convey the object code in, or embodied in, a physical product + (including a physical distribution medium), accompanied by the + Corresponding Source fixed on a durable physical medium + customarily used for software interchange. 
+ + b) Convey the object code in, or embodied in, a physical product + (including a physical distribution medium), accompanied by a + written offer, valid for at least three years and valid for as + long as you offer spare parts or customer support for that product + model, to give anyone who possesses the object code either (1) a + copy of the Corresponding Source for all the software in the + product that is covered by this License, on a durable physical + medium customarily used for software interchange, for a price no + more than your reasonable cost of physically performing this + conveying of source, or (2) access to copy the + Corresponding Source from a network server at no charge. + + c) Convey individual copies of the object code with a copy of the + written offer to provide the Corresponding Source. This + alternative is allowed only occasionally and noncommercially, and + only if you received the object code with such an offer, in accord + with subsection 6b. + + d) Convey the object code by offering access from a designated + place (gratis or for a charge), and offer equivalent access to the + Corresponding Source in the same way through the same place at no + further charge. You need not require recipients to copy the + Corresponding Source along with the object code. If the place to + copy the object code is a network server, the Corresponding Source + may be on a different server (operated by you or a third party) + that supports equivalent copying facilities, provided you maintain + clear directions next to the object code saying where to find the + Corresponding Source. Regardless of what server hosts the + Corresponding Source, you remain obligated to ensure that it is + available for as long as needed to satisfy these requirements. 
+ + e) Convey the object code using peer-to-peer transmission, provided + you inform other peers where the object code and Corresponding + Source of the work are being offered to the general public at no + charge under subsection 6d. + + A separable portion of the object code, whose source code is excluded +from the Corresponding Source as a System Library, need not be +included in conveying the object code work. + + A "User Product" is either (1) a "consumer product", which means any +tangible personal property which is normally used for personal, family, +or household purposes, or (2) anything designed or sold for incorporation +into a dwelling. In determining whether a product is a consumer product, +doubtful cases shall be resolved in favor of coverage. For a particular +product received by a particular user, "normally used" refers to a +typical or common use of that class of product, regardless of the status +of the particular user or of the way in which the particular user +actually uses, or expects or is expected to use, the product. A product +is a consumer product regardless of whether the product has substantial +commercial, industrial or non-consumer uses, unless such uses represent +the only significant mode of use of the product. + + "Installation Information" for a User Product means any methods, +procedures, authorization keys, or other information required to install +and execute modified versions of a covered work in that User Product from +a modified version of its Corresponding Source. The information must +suffice to ensure that the continued functioning of the modified object +code is in no case prevented or interfered with solely because +modification has been made. 
+ + If you convey an object code work under this section in, or with, or +specifically for use in, a User Product, and the conveying occurs as +part of a transaction in which the right of possession and use of the +User Product is transferred to the recipient in perpetuity or for a +fixed term (regardless of how the transaction is characterized), the +Corresponding Source conveyed under this section must be accompanied +by the Installation Information. But this requirement does not apply +if neither you nor any third party retains the ability to install +modified object code on the User Product (for example, the work has +been installed in ROM). + + The requirement to provide Installation Information does not include a +requirement to continue to provide support service, warranty, or updates +for a work that has been modified or installed by the recipient, or for +the User Product in which it has been modified or installed. Access to a +network may be denied when the modification itself materially and +adversely affects the operation of the network or violates the rules and +protocols for communication across the network. + + Corresponding Source conveyed, and Installation Information provided, +in accord with this section must be in a format that is publicly +documented (and with an implementation available to the public in +source code form), and must require no special password or key for +unpacking, reading or copying. + + 7. Additional Terms. + + "Additional permissions" are terms that supplement the terms of this +License by making exceptions from one or more of its conditions. +Additional permissions that are applicable to the entire Program shall +be treated as though they were included in this License, to the extent +that they are valid under applicable law. 
If additional permissions +apply only to part of the Program, that part may be used separately +under those permissions, but the entire Program remains governed by +this License without regard to the additional permissions. + + When you convey a copy of a covered work, you may at your option +remove any additional permissions from that copy, or from any part of +it. (Additional permissions may be written to require their own +removal in certain cases when you modify the work.) You may place +additional permissions on material, added by you to a covered work, +for which you have or can give appropriate copyright permission. + + Notwithstanding any other provision of this License, for material you +add to a covered work, you may (if authorized by the copyright holders of +that material) supplement the terms of this License with terms: + + a) Disclaiming warranty or limiting liability differently from the + terms of sections 15 and 16 of this License; or + + b) Requiring preservation of specified reasonable legal notices or + author attributions in that material or in the Appropriate Legal + Notices displayed by works containing it; or + + c) Prohibiting misrepresentation of the origin of that material, or + requiring that modified versions of such material be marked in + reasonable ways as different from the original version; or + + d) Limiting the use for publicity purposes of names of licensors or + authors of the material; or + + e) Declining to grant rights under trademark law for use of some + trade names, trademarks, or service marks; or + + f) Requiring indemnification of licensors and authors of that + material by anyone who conveys the material (or modified versions of + it) with contractual assumptions of liability to the recipient, for + any liability that these contractual assumptions directly impose on + those licensors and authors. + + All other non-permissive additional terms are considered "further +restrictions" within the meaning of section 10. 
If the Program as you +received it, or any part of it, contains a notice stating that it is +governed by this License along with a term that is a further +restriction, you may remove that term. If a license document contains +a further restriction but permits relicensing or conveying under this +License, you may add to a covered work material governed by the terms +of that license document, provided that the further restriction does +not survive such relicensing or conveying. + + If you add terms to a covered work in accord with this section, you +must place, in the relevant source files, a statement of the +additional terms that apply to those files, or a notice indicating +where to find the applicable terms. + + Additional terms, permissive or non-permissive, may be stated in the +form of a separately written license, or stated as exceptions; +the above requirements apply either way. + + 8. Termination. + + You may not propagate or modify a covered work except as expressly +provided under this License. Any attempt otherwise to propagate or +modify it is void, and will automatically terminate your rights under +this License (including any patent licenses granted under the third +paragraph of section 11). + + However, if you cease all violation of this License, then your +license from a particular copyright holder is reinstated (a) +provisionally, unless and until the copyright holder explicitly and +finally terminates your license, and (b) permanently, if the copyright +holder fails to notify you of the violation by some reasonable means +prior to 60 days after the cessation. + + Moreover, your license from a particular copyright holder is +reinstated permanently if the copyright holder notifies you of the +violation by some reasonable means, this is the first time you have +received notice of violation of this License (for any work) from that +copyright holder, and you cure the violation prior to 30 days after +your receipt of the notice. 
+ + Termination of your rights under this section does not terminate the +licenses of parties who have received copies or rights from you under +this License. If your rights have been terminated and not permanently +reinstated, you do not qualify to receive new licenses for the same +material under section 10. + + 9. Acceptance Not Required for Having Copies. + + You are not required to accept this License in order to receive or +run a copy of the Program. Ancillary propagation of a covered work +occurring solely as a consequence of using peer-to-peer transmission +to receive a copy likewise does not require acceptance. However, +nothing other than this License grants you permission to propagate or +modify any covered work. These actions infringe copyright if you do +not accept this License. Therefore, by modifying or propagating a +covered work, you indicate your acceptance of this License to do so. + + 10. Automatic Licensing of Downstream Recipients. + + Each time you convey a covered work, the recipient automatically +receives a license from the original licensors, to run, modify and +propagate that work, subject to this License. You are not responsible +for enforcing compliance by third parties with this License. + + An "entity transaction" is a transaction transferring control of an +organization, or substantially all assets of one, or subdividing an +organization, or merging organizations. If propagation of a covered +work results from an entity transaction, each party to that +transaction who receives a copy of the work also receives whatever +licenses to the work the party's predecessor in interest had or could +give under the previous paragraph, plus a right to possession of the +Corresponding Source of the work from the predecessor in interest, if +the predecessor has it or can get it with reasonable efforts. + + You may not impose any further restrictions on the exercise of the +rights granted or affirmed under this License. 
For example, you may +not impose a license fee, royalty, or other charge for exercise of +rights granted under this License, and you may not initiate litigation +(including a cross-claim or counterclaim in a lawsuit) alleging that +any patent claim is infringed by making, using, selling, offering for +sale, or importing the Program or any portion of it. + + 11. Patents. + + A "contributor" is a copyright holder who authorizes use under this +License of the Program or a work on which the Program is based. The +work thus licensed is called the contributor's "contributor version". + + A contributor's "essential patent claims" are all patent claims +owned or controlled by the contributor, whether already acquired or +hereafter acquired, that would be infringed by some manner, permitted +by this License, of making, using, or selling its contributor version, +but do not include claims that would be infringed only as a +consequence of further modification of the contributor version. For +purposes of this definition, "control" includes the right to grant +patent sublicenses in a manner consistent with the requirements of +this License. + + Each contributor grants you a non-exclusive, worldwide, royalty-free +patent license under the contributor's essential patent claims, to +make, use, sell, offer for sale, import and otherwise run, modify and +propagate the contents of its contributor version. + + In the following three paragraphs, a "patent license" is any express +agreement or commitment, however denominated, not to enforce a patent +(such as an express permission to practice a patent or covenant not to +sue for patent infringement). To "grant" such a patent license to a +party means to make such an agreement or commitment not to enforce a +patent against the party. 
+ + If you convey a covered work, knowingly relying on a patent license, +and the Corresponding Source of the work is not available for anyone +to copy, free of charge and under the terms of this License, through a +publicly available network server or other readily accessible means, +then you must either (1) cause the Corresponding Source to be so +available, or (2) arrange to deprive yourself of the benefit of the +patent license for this particular work, or (3) arrange, in a manner +consistent with the requirements of this License, to extend the patent +license to downstream recipients. "Knowingly relying" means you have +actual knowledge that, but for the patent license, your conveying the +covered work in a country, or your recipient's use of the covered work +in a country, would infringe one or more identifiable patents in that +country that you have reason to believe are valid. + + If, pursuant to or in connection with a single transaction or +arrangement, you convey, or propagate by procuring conveyance of, a +covered work, and grant a patent license to some of the parties +receiving the covered work authorizing them to use, propagate, modify +or convey a specific copy of the covered work, then the patent license +you grant is automatically extended to all recipients of the covered +work and works based on it. + + A patent license is "discriminatory" if it does not include within +the scope of its coverage, prohibits the exercise of, or is +conditioned on the non-exercise of one or more of the rights that are +specifically granted under this License. 
You may not convey a covered +work if you are a party to an arrangement with a third party that is +in the business of distributing software, under which you make payment +to the third party based on the extent of your activity of conveying +the work, and under which the third party grants, to any of the +parties who would receive the covered work from you, a discriminatory +patent license (a) in connection with copies of the covered work +conveyed by you (or copies made from those copies), or (b) primarily +for and in connection with specific products or compilations that +contain the covered work, unless you entered into that arrangement, +or that patent license was granted, prior to 28 March 2007. + + Nothing in this License shall be construed as excluding or limiting +any implied license or other defenses to infringement that may +otherwise be available to you under applicable patent law. + + 12. No Surrender of Others' Freedom. + + If conditions are imposed on you (whether by court order, agreement or +otherwise) that contradict the conditions of this License, they do not +excuse you from the conditions of this License. If you cannot convey a +covered work so as to satisfy simultaneously your obligations under this +License and any other pertinent obligations, then as a consequence you may +not convey it at all. For example, if you agree to terms that obligate you +to collect a royalty for further conveying from those to whom you convey +the Program, the only way you could satisfy both those terms and this +License would be to refrain entirely from conveying the Program. + + 13. Remote Network Interaction; Use with the GNU General Public License. 
+ + Notwithstanding any other provision of this License, if you modify the +Program, your modified version must prominently offer all users +interacting with it remotely through a computer network (if your version +supports such interaction) an opportunity to receive the Corresponding +Source of your version by providing access to the Corresponding Source +from a network server at no charge, through some standard or customary +means of facilitating copying of software. This Corresponding Source +shall include the Corresponding Source for any work covered by version 3 +of the GNU General Public License that is incorporated pursuant to the +following paragraph. + + Notwithstanding any other provision of this License, you have +permission to link or combine any covered work with a work licensed +under version 3 of the GNU General Public License into a single +combined work, and to convey the resulting work. The terms of this +License will continue to apply to the part which is the covered work, +but the work with which it is combined will remain governed by version +3 of the GNU General Public License. + + 14. Revised Versions of this License. + + The Free Software Foundation may publish revised and/or new versions of +the GNU Affero General Public License from time to time. Such new versions +will be similar in spirit to the present version, but may differ in detail to +address new problems or concerns. + + Each version is given a distinguishing version number. If the +Program specifies that a certain numbered version of the GNU Affero General +Public License "or any later version" applies to it, you have the +option of following the terms and conditions either of that numbered +version or of any later version published by the Free Software +Foundation. If the Program does not specify a version number of the +GNU Affero General Public License, you may choose any version ever published +by the Free Software Foundation. 
+ + If the Program specifies that a proxy can decide which future +versions of the GNU Affero General Public License can be used, that proxy's +public statement of acceptance of a version permanently authorizes you +to choose that version for the Program. + + Later license versions may give you additional or different +permissions. However, no additional obligations are imposed on any +author or copyright holder as a result of your choosing to follow a +later version. + + 15. Disclaimer of Warranty. + + THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY +APPLICABLE LAW. EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT +HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY +OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, +THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR +PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM +IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF +ALL NECESSARY SERVICING, REPAIR OR CORRECTION. + + 16. Limitation of Liability. + + IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING +WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS +THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY +GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE +USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF +DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD +PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS), +EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF +SUCH DAMAGES. + + 17. Interpretation of Sections 15 and 16. 
+ + If the disclaimer of warranty and limitation of liability provided +above cannot be given local legal effect according to their terms, +reviewing courts shall apply local law that most closely approximates +an absolute waiver of all civil liability in connection with the +Program, unless a warranty or assumption of liability accompanies a +copy of the Program in return for a fee. + + END OF TERMS AND CONDITIONS + + How to Apply These Terms to Your New Programs + + If you develop a new program, and you want it to be of the greatest +possible use to the public, the best way to achieve this is to make it +free software which everyone can redistribute and change under these terms. + + To do so, attach the following notices to the program. It is safest +to attach them to the start of each source file to most effectively +state the exclusion of warranty; and each file should have at least +the "copyright" line and a pointer to where the full notice is found. + + <one line to give the program's name and a brief idea of what it does.> + Copyright (C) <year> <name of author> + + This program is free software: you can redistribute it and/or modify + it under the terms of the GNU Affero General Public License as published + by the Free Software Foundation, either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU Affero General Public License for more details. + + You should have received a copy of the GNU Affero General Public License + along with this program. If not, see <https://www.gnu.org/licenses/>. + +Also add information on how to contact you by electronic and paper mail. + + If your software can interact with users remotely through a computer +network, you should also make sure that it provides a way for users to +get its source. For example, if your program is a web application, its +interface could display a "Source" link that leads users to an archive +of the code.
There are many ways you could offer source, and different +solutions will be better for different programs; see section 13 for the +specific requirements. + + You should also get your employer (if you work as a programmer) or school, +if any, to sign a "copyright disclaimer" for the program, if necessary. +For more information on this, and how to apply and follow the GNU AGPL, see +<https://www.gnu.org/licenses/>. diff --git a/figs/VAD_auditok.png b/figs/VAD_auditok.png new file mode 100644 index 0000000000000000000000000000000000000000..9dbaa4adc16a3082df4a6b17ddb3e4dbc0d4c227 Binary files /dev/null and b/figs/VAD_auditok.png differ diff --git a/figs/VAD_silero_v3.1.png b/figs/VAD_silero_v3.1.png new file mode 100644 index 0000000000000000000000000000000000000000..5216ef11328b5437fe715c63f66c0b095e0442d8 Binary files /dev/null and b/figs/VAD_silero_v3.1.png differ diff --git a/figs/VAD_silero_v4.0.png b/figs/VAD_silero_v4.0.png new file mode 100644 index 0000000000000000000000000000000000000000..3b516f9a5ac8eebf05688f7689ae49ae0dc4f24b Binary files /dev/null and b/figs/VAD_silero_v4.0.png differ diff --git a/figs/example_alignement_plot.png b/figs/example_alignement_plot.png new file mode 100644 index 0000000000000000000000000000000000000000..504528ece2e36b2cec4990ccdfcdc1d771a14beb Binary files /dev/null and b/figs/example_alignement_plot.png differ diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5a15670950a2dca208b867d00ff408e2cd577f3 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,3 @@ +Cython +dtw-python +openai-whisper \ No newline at end of file diff --git a/setup.py b/setup.py new file mode 100644 index 0000000000000000000000000000000000000000..e49e71edb8ef44278a78b9cdc4bdb88ef6eb0512 --- /dev/null +++ b/setup.py @@ -0,0 +1,58 @@ +import os + +from setuptools import setup, find_packages + +install_requires = [ + "Cython", + "dtw-python", + "openai-whisper", +] + +required_packages_filename =
os.path.join(os.path.dirname(__file__), "requirements.txt") +if os.path.exists(required_packages_filename): + install_requires2 = [l.strip() for l in open(required_packages_filename).readlines()] + assert install_requires == install_requires2, f"requirements.txt is not up-to-date: {install_requires} != {install_requires2}" + +version = None +license = None +with open(os.path.join(os.path.dirname(__file__), "whisper_timestamped", "transcribe.py")) as f: + for line in f: + if line.strip().startswith("__version__"): + version = line.split("=")[1].strip().strip("\"'") + if version and license: + break + if line.strip().startswith("__license__"): + license = line.split("=")[1].strip().strip("\"'") + if version and license: + break +assert version and license + +description="Multi-lingual Automatic Speech Recognition (ASR) based on Whisper models, with accurate word timestamps, access to language detection confidence, several options for Voice Activity Detection (VAD), and more." + +setup( + name="whisper-timestamped", + py_modules=["whisper_timestamped"], + version=version, + description=description, + long_description=description+"\nSee https://github.com/linto-ai/whisper-timestamped for more information.", + long_description_content_type='text/markdown', + python_requires=">=3.7", + author="Jeronymous", + url="https://github.com/linto-ai/whisper-timestamped", + license=license, + packages=find_packages(exclude=["tests*"]), + install_requires=install_requires, + entry_points = { + 'console_scripts': [ + 'whisper_timestamped=whisper_timestamped.transcribe:cli', + 'whisper_timestamped_make_subtitles=whisper_timestamped.make_subtitles:cli' + ], + }, + include_package_data=True, + extras_require={ + 'dev': ['matplotlib', 'transformers'], + 'vad_silero': ['onnxruntime', 'torchaudio'], + 'vad_auditok': ['auditok'], + 'test': ['jsonschema'], + }, +) diff --git a/tests/__init__.py b/tests/__init__.py new file mode 100644 index 
0000000000000000000000000000000000000000..8b137891791fe96927ad78e64b0aad7bded08bdc --- /dev/null +++ b/tests/__init__.py @@ -0,0 +1 @@ + diff --git a/tests/data/apollo11.mp3 b/tests/data/apollo11.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..d9246ca9f73701df5270dd342bdca2d316eda5b3 Binary files /dev/null and b/tests/data/apollo11.mp3 differ diff --git a/tests/data/bonjour.wav b/tests/data/bonjour.wav new file mode 100644 index 0000000000000000000000000000000000000000..f03944e35c448f2226923356f7208d0234a6419a Binary files /dev/null and b/tests/data/bonjour.wav differ diff --git a/tests/data/bonjour_vous_allez_bien.mp3 b/tests/data/bonjour_vous_allez_bien.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..53bd078e6610cca0bddf7dbcaff2b2a991028c51 Binary files /dev/null and b/tests/data/bonjour_vous_allez_bien.mp3 differ diff --git a/tests/data/empty.mp3 b/tests/data/empty.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..a73b2f2f14d2f33beb872041f64abc0208eee70b Binary files /dev/null and b/tests/data/empty.mp3 differ diff --git a/tests/data/empty.wav b/tests/data/empty.wav new file mode 100644 index 0000000000000000000000000000000000000000..a15eb0580e1a5cd7cd4b4d3e610155a3a967c81b Binary files /dev/null and b/tests/data/empty.wav differ diff --git a/tests/data/gaenswein15.mp3 b/tests/data/gaenswein15.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..48689cfe8af4a3873f7c988793bd48ab12523094 Binary files /dev/null and b/tests/data/gaenswein15.mp3 differ diff --git a/tests/data/gloria.mp3 b/tests/data/gloria.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..8289f3989deb8bccd19b102b9530974600791798 Binary files /dev/null and b/tests/data/gloria.mp3 differ diff --git a/tests/data/japanese.mp3 b/tests/data/japanese.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..10337faea507f73c0add491837ad997e5656741a Binary files /dev/null and 
b/tests/data/japanese.mp3 differ diff --git a/tests/data/laugh1.mp3 b/tests/data/laugh1.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..c564abe8c4f87cbaa1ee1998f17a36a1592f5c61 Binary files /dev/null and b/tests/data/laugh1.mp3 differ diff --git a/tests/data/laugh2.mp3 b/tests/data/laugh2.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..b8fb8840f31d416eab241969a1b5f2da067a6acf Binary files /dev/null and b/tests/data/laugh2.mp3 differ diff --git a/tests/data/no_punctuations.mp3.words.json b/tests/data/no_punctuations.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..46d20abcf33869ed2f4eda32988e19619cfaf7b4 --- /dev/null +++ b/tests/data/no_punctuations.mp3.words.json @@ -0,0 +1,68 @@ +{ + "text": " Dis-moi, est-ce que l'avion vole?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.4, + "end": 2.34, + "text": " Dis-moi, est-ce que l'avion vole?", + "tokens": [ + 50364, + 4208, + 12, + 29292, + 11, + 871, + 12, + 384, + 631, + 287, + 6, + 706, + 313, + 49877, + 2506, + 50494 + ], + "temperature": 0.0, + "avg_logprob": -0.3014036907869227, + "compression_ratio": 0.8048780487804879, + "no_speech_prob": 0.05134102329611778, + "confidence": 0.925, + "words": [ + { + "text": "Dis-moi", + "start": 0.4, + "end": 1.36, + "confidence": 0.801 + }, + { + "text": "est-ce", + "start": 1.36, + "end": 1.52, + "confidence": 0.966 + }, + { + "text": "que", + "start": 1.52, + "end": 1.64, + "confidence": 0.977 + }, + { + "text": "l'avion", + "start": 1.64, + "end": 2.02, + "confidence": 0.994 + }, + { + "text": "vole", + "start": 2.02, + "end": 2.34, + "confidence": 0.891 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/data/punctuations.mp3 b/tests/data/punctuations.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..b797032d15a7fc9cd575f79bd6ec43e37e66e555 Binary files /dev/null and b/tests/data/punctuations.mp3 differ diff --git 
a/tests/data/radio_short.mp3 b/tests/data/radio_short.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..1772d945c050cb88948fb3b4d7f84657e06a90d7 Binary files /dev/null and b/tests/data/radio_short.mp3 differ diff --git a/tests/data/smartphone.mp3 b/tests/data/smartphone.mp3 new file mode 100644 index 0000000000000000000000000000000000000000..9c1c12473bf6c5485426a4f563b1385fd039f243 Binary files /dev/null and b/tests/data/smartphone.mp3 differ diff --git a/tests/data/smartphone.mp3.words.json b/tests/data/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..8cf211f5b9abc1b522e115e190503add6af20a12 --- /dev/null +++ b/tests/data/smartphone.mp3.words.json @@ -0,0 +1,4802 @@ +{ + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions, mais la manière dont elles interagissent entre elles. Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces. L'écran tactile a été beaucoup très souvent mentionné. Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes. Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible. Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but. Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité. Mais ça, ça soulève une autre interrogation. Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit? Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone? 
Il n'y a pas d'équivalent en fait. Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant. Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendants de cet objet, d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet. Donc, à objet inédit, rapport inédit. Et ce rapport, si j'en crois Nicolas, serait caractérisé par un mélange de dépendance et de rejet. Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment. Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre. On peut adorer sa bagnole, en avoir besoin pour plein de choses. Et bien, le soir, quand on va se coucher, on la laisse. On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes. On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui, continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe, comme si le lâcher allait entraîner sa mort immédiate. Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi. Donc, rapport inédit. D'accord. Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais? Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux? Les économistes parlent de dépendance du sentier. 
C'est l'idée qu'on est sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.38, + "end": 3.62, + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça.", + "tokens": [ + 383, + 6, + 377, + 20090, + 1078, + 1769, + 631, + 6176, + 38268, + 11, + 2420, + 1506, + 408, + 385, + 287, + 6, + 22824, + 14540, + 49990, + 526, + 5173, + 2788, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.2362671656324374, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.935, + "words": [ + { + "text": "C'est", + "start": 0.38, + "end": 0.58, + "confidence": 0.961 + }, + { + "text": "évident", + "start": 0.58, + "end": 0.88, + "confidence": 0.984 + }, + { + "text": "ce", + "start": 0.88, + "end": 1.02, + "confidence": 0.663 + }, + { + "text": "que", + "start": 1.02, + "end": 1.08, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 1.08, + "end": 1.2, + "confidence": 0.994 + }, + { + "text": "Nicolas,", + "start": 1.2, + "end": 1.78, + "confidence": 0.91 + }, + { + "text": "mais", + "start": 1.78, + "end": 1.9, + "confidence": 0.979 + }, + { + "text": "je", + "start": 1.9, + "end": 2.24, + "confidence": 0.981 + }, + { + "text": "ne", + "start": 2.24, + "end": 2.34, + "confidence": 0.837 + }, + { + "text": "me", + "start": 2.34, + "end": 2.38, + "confidence": 0.821 + }, + { + "text": "l'étais", + "start": 2.38, + "end": 2.58, + "confidence": 0.971 + }, + { + "text": "jamais", + "start": 2.58, + "end": 2.84, + "confidence": 0.989 + }, + { + "text": "formulé", + "start": 2.84, + "end": 3.26, + "confidence": 0.908 + }, + { + "text": "comme", + "start": 3.26, + "end": 3.42, + "confidence": 0.993 + }, + { + "text": "ça.", + "start": 3.42, + "end": 3.62, + "confidence": 0.975 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 4.08, + "end": 7.92, + "text": " 
Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions,", + "tokens": [ + 8257, + 1956, + 3887, + 635, + 3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 287, + 6, + 8476, + 449, + 2776, + 730, + 17290, + 3916, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.2362671656324374, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.93, + "words": [ + { + "text": "Ce", + "start": 4.08, + "end": 4.26, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 4.26, + "end": 4.34, + "confidence": 0.958 + }, + { + "text": "fait", + "start": 4.34, + "end": 4.48, + "confidence": 0.567 + }, + { + "text": "la", + "start": 4.48, + "end": 4.66, + "confidence": 0.972 + }, + { + "text": "force", + "start": 4.66, + "end": 5.0, + "confidence": 0.999 + }, + { + "text": "du", + "start": 5.0, + "end": 5.2, + "confidence": 0.996 + }, + { + "text": "smartphone,", + "start": 5.2, + "end": 5.88, + "confidence": 0.912 + }, + { + "text": "c'est", + "start": 5.88, + "end": 6.12, + "confidence": 0.879 + }, + { + "text": "pas", + "start": 6.12, + "end": 6.26, + "confidence": 0.991 + }, + { + "text": "seulement", + "start": 6.26, + "end": 6.52, + "confidence": 0.999 + }, + { + "text": "l'accumulation", + "start": 6.52, + "end": 7.38, + "confidence": 0.958 + }, + { + "text": "des", + "start": 7.38, + "end": 7.56, + "confidence": 0.983 + }, + { + "text": "fonctions,", + "start": 7.56, + "end": 7.92, + "confidence": 0.987 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 8.32, + "end": 10.88, + "text": " mais la manière dont elles interagissent entre elles.", + "tokens": [ + 2420, + 635, + 22267, + 9400, + 23576, + 728, + 559, + 25450, + 3962, + 23576, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.2362671656324374, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.977, + "words": [ + { + "text": "mais", + "start": 8.32, + "end": 8.44, + 
"confidence": 0.992 + }, + { + "text": "la", + "start": 8.44, + "end": 8.6, + "confidence": 0.995 + }, + { + "text": "manière", + "start": 8.6, + "end": 8.9, + "confidence": 0.999 + }, + { + "text": "dont", + "start": 8.9, + "end": 9.1, + "confidence": 0.978 + }, + { + "text": "elles", + "start": 9.1, + "end": 9.48, + "confidence": 0.967 + }, + { + "text": "interagissent", + "start": 9.48, + "end": 10.32, + "confidence": 0.964 + }, + { + "text": "entre", + "start": 10.32, + "end": 10.58, + "confidence": 0.955 + }, + { + "text": "elles.", + "start": 10.58, + "end": 10.88, + "confidence": 0.989 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 10.96, + "end": 13.0, + "text": " Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant.", + "tokens": [ + 8257, + 1956, + 6176, + 274, + 6, + 19400, + 1022, + 635, + 5052, + 11, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.2362671656324374, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.906, + "words": [ + { + "text": "Ce", + "start": 10.96, + "end": 11.16, + "confidence": 0.608 + }, + { + "text": "qui", + "start": 11.16, + "end": 11.22, + "confidence": 0.769 + }, + { + "text": "dit", + "start": 11.22, + "end": 11.4, + "confidence": 0.983 + }, + { + "text": "d'ailleurs", + "start": 11.4, + "end": 11.56, + "confidence": 0.985 + }, + { + "text": "sur", + "start": 11.56, + "end": 11.72, + "confidence": 0.48 + }, + { + "text": "la", + "start": 11.72, + "end": 11.78, + "confidence": 0.984 + }, + { + "text": "photo,", + "start": 11.78, + "end": 12.12, + "confidence": 0.994 + }, + { + "text": "c'est", + "start": 12.12, + "end": 12.2, + "confidence": 0.997 + }, + { + "text": "hyper", + "start": 12.2, + "end": 12.42, + "confidence": 0.993 + }, + { + "text": "convaincant.", + "start": 12.42, + "end": 13.0, + "confidence": 0.982 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.34, + "end": 16.02, + "text": " 
Alors évidemment, il faudrait ajouter les interfaces.", + "tokens": [ + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.2362671656324374, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.912, + "words": [ + { + "text": "Alors", + "start": 13.34, + "end": 13.62, + "confidence": 0.584 + }, + { + "text": "évidemment,", + "start": 13.62, + "end": 14.34, + "confidence": 0.832 + }, + { + "text": "il", + "start": 14.34, + "end": 14.38, + "confidence": 0.953 + }, + { + "text": "faudrait", + "start": 14.38, + "end": 14.74, + "confidence": 0.996 + }, + { + "text": "ajouter", + "start": 14.74, + "end": 15.16, + "confidence": 0.992 + }, + { + "text": "les", + "start": 15.16, + "end": 15.52, + "confidence": 0.985 + }, + { + "text": "interfaces.", + "start": 15.52, + "end": 16.02, + "confidence": 0.984 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 16.22, + "end": 19.36, + "text": " L'écran tactile a été beaucoup très souvent mentionné.", + "tokens": [ + 441, + 6, + 9062, + 4257, + 47319, + 257, + 8862, + 8796, + 5732, + 20847, + 2152, + 15055, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.2362671656324374, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.923, + "words": [ + { + "text": "L'écran", + "start": 16.22, + "end": 16.7, + "confidence": 0.996 + }, + { + "text": "tactile", + "start": 16.7, + "end": 17.06, + "confidence": 0.986 + }, + { + "text": "a", + "start": 17.06, + "end": 17.26, + "confidence": 0.98 + }, + { + "text": "été", + "start": 17.26, + "end": 17.88, + "confidence": 0.974 + }, + { + "text": "beaucoup", + "start": 17.88, + "end": 18.28, + "confidence": 0.976 + }, + { + "text": "très", + "start": 18.28, + "end": 18.62, + "confidence": 0.447 + }, + { + "text": "souvent", + "start": 18.62, + "end": 18.9, + "confidence": 0.996 + }, + { + "text": "mentionné.", + 
"start": 18.9, + "end": 19.36, + "confidence": 0.978 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 19.84, + "end": 25.26, + "text": " Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes.", + "tokens": [ + 6313, + 4428, + 11, + 1930, + 8487, + 1264, + 421, + 6, + 388, + 1740, + 642, + 6212, + 368, + 945, + 1567, + 17338, + 1512, + 358, + 1625, + 1512, + 4792, + 13923, + 2156, + 4666, + 6592, + 724, + 5714, + 1531, + 596, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.2362671656324374, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.92, + "words": [ + { + "text": "Mais", + "start": 19.84, + "end": 20.22, + "confidence": 0.943 + }, + { + "text": "bon,", + "start": 20.22, + "end": 20.52, + "confidence": 0.666 + }, + { + "text": "il", + "start": 20.52, + "end": 20.6, + "confidence": 0.99 + }, + { + "text": "faut", + "start": 20.6, + "end": 20.7, + "confidence": 0.99 + }, + { + "text": "dire", + "start": 20.7, + "end": 20.84, + "confidence": 0.995 + }, + { + "text": "qu'il", + "start": 20.84, + "end": 20.96, + "confidence": 0.88 + }, + { + "text": "profite", + "start": 20.96, + "end": 21.26, + "confidence": 0.995 + }, + { + "text": "aussi", + "start": 21.26, + "end": 21.68, + "confidence": 0.972 + }, + { + "text": "de", + "start": 21.68, + "end": 21.9, + "confidence": 0.97 + }, + { + "text": "20", + "start": 21.9, + "end": 22.1, + "confidence": 0.812 + }, + { + "text": "ans", + "start": 22.1, + "end": 22.32, + "confidence": 0.997 + }, + { + "text": "pendant", + "start": 22.32, + "end": 22.48, + "confidence": 0.723 + }, + { + "text": "lesquels", + "start": 22.48, + "end": 22.92, + "confidence": 0.98 + }, + { + "text": "les", + "start": 22.92, + "end": 23.04, + "confidence": 0.71 + }, + { + "text": "ordinateurs", + "start": 23.04, + "end": 23.54, + "confidence": 0.966 + }, + { + "text": 
"nous", + "start": 23.54, + "end": 23.72, + "confidence": 0.602 + }, + { + "text": "ont", + "start": 23.72, + "end": 23.82, + "confidence": 0.974 + }, + { + "text": "appris", + "start": 23.82, + "end": 24.1, + "confidence": 0.991 + }, + { + "text": "à", + "start": 24.1, + "end": 24.24, + "confidence": 0.828 + }, + { + "text": "cliquer", + "start": 24.24, + "end": 24.5, + "confidence": 0.989 + }, + { + "text": "sur", + "start": 24.5, + "end": 24.66, + "confidence": 0.984 + }, + { + "text": "des", + "start": 24.66, + "end": 24.94, + "confidence": 0.971 + }, + { + "text": "icônes.", + "start": 24.94, + "end": 25.26, + "confidence": 0.992 + } + ] + }, + { + "id": 7, + "seek": 2534, + "start": 25.42, + "end": 30.64, + "text": " Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible.", + "tokens": [ + 318, + 9507, + 631, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 1769, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07923513396173461, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.4465685985196615e-06, + "confidence": 0.969, + "words": [ + { + "text": "Sauf", + "start": 25.42, + "end": 25.76, + "confidence": 0.99 + }, + { + "text": "que", + "start": 25.76, + "end": 26.26, + "confidence": 0.996 + }, + { + "text": "le", + "start": 26.26, + "end": 26.66, + "confidence": 0.632 + }, + { + "text": "smartphone", + "start": 26.66, + "end": 27.06, + "confidence": 0.996 + }, + { + "text": "ajoute", + "start": 27.06, + "end": 27.44, + "confidence": 0.991 + }, + { + "text": "le", + "start": 27.44, + "end": 27.62, + "confidence": 0.992 + }, + { + "text": "toucher,", + "start": 27.62, + "end": 28.18, + "confidence": 0.988 + }, + { + "text": "ce", + "start": 28.18, + "end": 28.22, + "confidence": 0.989 + }, + { + "text": "qui", + "start": 28.22, + "end": 28.28, + "confidence": 1.0 + }, + { + "text": "rend", + "start": 28.28, + "end": 
28.48, + "confidence": 0.994 + }, + { + "text": "le", + "start": 28.48, + "end": 28.68, + "confidence": 0.993 + }, + { + "text": "contact", + "start": 28.68, + "end": 29.1, + "confidence": 0.999 + }, + { + "text": "plus", + "start": 29.1, + "end": 29.46, + "confidence": 0.985 + }, + { + "text": "direct,", + "start": 29.46, + "end": 30.22, + "confidence": 0.995 + }, + { + "text": "plus", + "start": 30.22, + "end": 30.26, + "confidence": 0.994 + }, + { + "text": "sensible.", + "start": 30.26, + "end": 30.64, + "confidence": 0.997 + } + ] + }, + { + "id": 8, + "seek": 2534, + "start": 31.04, + "end": 37.82, + "text": " Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but.", + "tokens": [ + 3790, + 9093, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193, + 476, + 18437, + 10095, + 602, + 84, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 1609, + 457, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07923513396173461, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.4465685985196615e-06, + "confidence": 0.892, + "words": [ + { + "text": "Et", + "start": 31.04, + "end": 31.22, + "confidence": 0.97 + }, + { + "text": "puis", + "start": 31.22, + "end": 31.36, + "confidence": 0.971 + }, + { + "text": "évidemment,", + "start": 31.36, + "end": 31.7, + "confidence": 0.875 + }, + { + "text": "il", + "start": 31.7, + "end": 31.74, + "confidence": 0.993 + }, + { + "text": "faudrait", + "start": 31.74, + "end": 31.94, + "confidence": 0.995 + }, + { + "text": "parler", + "start": 31.94, + "end": 32.12, + "confidence": 0.839 + }, + { + "text": "aussi", + "start": 32.12, + "end": 32.34, + "confidence": 0.977 + }, + { + "text": "des", + "start": 32.34, + "end": 32.48, + "confidence": 0.994 + }, + { + "text": "applications", + "start": 32.48, + "end": 32.9, + "confidence": 0.993 + }, + 
{ + "text": "qui", + "start": 32.9, + "end": 33.18, + "confidence": 0.482 + }, + { + "text": "permettent", + "start": 33.18, + "end": 33.74, + "confidence": 0.992 + }, + { + "text": "de", + "start": 33.74, + "end": 33.96, + "confidence": 0.884 + }, + { + "text": "contourner", + "start": 33.96, + "end": 34.42, + "confidence": 0.959 + }, + { + "text": "le", + "start": 34.42, + "end": 34.52, + "confidence": 0.777 + }, + { + "text": "côté", + "start": 34.52, + "end": 34.8, + "confidence": 0.984 + }, + { + "text": "touffu", + "start": 34.8, + "end": 35.32, + "confidence": 0.741 + }, + { + "text": "de", + "start": 35.32, + "end": 35.72, + "confidence": 0.882 + }, + { + "text": "la", + "start": 35.72, + "end": 35.78, + "confidence": 0.992 + }, + { + "text": "navigation", + "start": 35.78, + "end": 36.24, + "confidence": 0.994 + }, + { + "text": "web", + "start": 36.24, + "end": 36.6, + "confidence": 0.854 + }, + { + "text": "pour", + "start": 36.6, + "end": 36.78, + "confidence": 0.583 + }, + { + "text": "aller", + "start": 36.78, + "end": 36.98, + "confidence": 0.987 + }, + { + "text": "directement", + "start": 36.98, + "end": 37.52, + "confidence": 0.997 + }, + { + "text": "au", + "start": 37.52, + "end": 37.68, + "confidence": 0.967 + }, + { + "text": "but.", + "start": 37.68, + "end": 37.82, + "confidence": 0.995 + } + ] + }, + { + "id": 9, + "seek": 2534, + "start": 37.82, + "end": 46.58, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 8603, + 14964, + 9400, + 38268, + 6176, + 421, + 6, + 388, + 871, + 6070, + 271, + 443, + 5199, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07923513396173461, + "compression_ratio": 
1.6254416961130742, + "no_speech_prob": 3.4465685985196615e-06, + "confidence": 0.974, + "words": [ + { + "text": "Bref,", + "start": 37.82, + "end": 38.76, + "confidence": 0.987 + }, + { + "text": "tout", + "start": 38.76, + "end": 38.98, + "confidence": 0.711 + }, + { + "text": "ça,", + "start": 38.98, + "end": 39.42, + "confidence": 0.995 + }, + { + "text": "ce", + "start": 39.42, + "end": 39.7, + "confidence": 0.993 + }, + { + "text": "sont", + "start": 39.7, + "end": 39.88, + "confidence": 0.999 + }, + { + "text": "les", + "start": 39.88, + "end": 40.16, + "confidence": 0.991 + }, + { + "text": "conditions", + "start": 40.16, + "end": 40.68, + "confidence": 0.995 + }, + { + "text": "qui", + "start": 40.68, + "end": 40.96, + "confidence": 0.997 + }, + { + "text": "permettent", + "start": 40.96, + "end": 41.46, + "confidence": 0.997 + }, + { + "text": "de", + "start": 41.46, + "end": 41.6, + "confidence": 0.998 + }, + { + "text": "créer", + "start": 41.6, + "end": 42.06, + "confidence": 0.998 + }, + { + "text": "cet", + "start": 42.06, + "end": 42.38, + "confidence": 0.998 + }, + { + "text": "objet", + "start": 42.38, + "end": 42.6, + "confidence": 0.994 + }, + { + "text": "dont", + "start": 42.6, + "end": 42.8, + "confidence": 0.78 + }, + { + "text": "Nicolas", + "start": 42.8, + "end": 43.26, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 43.26, + "end": 43.5, + "confidence": 0.986 + }, + { + "text": "qu'il", + "start": 43.5, + "end": 43.7, + "confidence": 0.983 + }, + { + "text": "est", + "start": 43.7, + "end": 43.88, + "confidence": 0.991 + }, + { + "text": "vraisemblablement", + "start": 43.88, + "end": 44.98, + "confidence": 0.991 + }, + { + "text": "inédit", + "start": 44.98, + "end": 45.38, + "confidence": 0.981 + }, + { + "text": "dans", + "start": 45.38, + "end": 45.7, + "confidence": 0.969 + }, + { + "text": "l'histoire", + "start": 45.7, + "end": 45.98, + "confidence": 0.957 + }, + { + "text": "de", + "start": 45.98, + "end": 46.18, + 
"confidence": 0.999 + }, + { + "text": "l'humanité.", + "start": 46.18, + "end": 46.58, + "confidence": 0.992 + } + ] + }, + { + "id": 10, + "seek": 2534, + "start": 46.6, + "end": 48.82, + "text": " Mais ça, ça soulève une autre interrogation.", + "tokens": [ + 6313, + 2788, + 11, + 2788, + 5133, + 31397, + 2251, + 15081, + 24871, + 399, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07923513396173461, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.4465685985196615e-06, + "confidence": 0.969, + "words": [ + { + "text": "Mais", + "start": 46.6, + "end": 47.24, + "confidence": 0.845 + }, + { + "text": "ça,", + "start": 47.24, + "end": 47.72, + "confidence": 0.934 + }, + { + "text": "ça", + "start": 47.72, + "end": 47.76, + "confidence": 0.977 + }, + { + "text": "soulève", + "start": 47.76, + "end": 47.84, + "confidence": 0.993 + }, + { + "text": "une", + "start": 47.84, + "end": 48.02, + "confidence": 0.998 + }, + { + "text": "autre", + "start": 48.02, + "end": 48.26, + "confidence": 0.999 + }, + { + "text": "interrogation.", + "start": 48.26, + "end": 48.82, + "confidence": 0.997 + } + ] + }, + { + "id": 11, + "seek": 4884, + "start": 49.22, + "end": 55.46, + "text": " Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit?", + "tokens": [ + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 8603, + 14964, + 12703, + 294, + 7811, + 270, + 13716, + 270, + 631, + 10349, + 18018, + 1531, + 8783, + 871, + 6212, + 517, + 18018, + 294, + 7811, + 270, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.10683460109281225, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.2805365258827806e-05, + "confidence": 0.988, + "words": [ + { + "text": "Est-ce", + "start": 49.22, + "end": 49.62, + "confidence": 0.982 + }, + { + "text": "que", + "start": 49.62, + "end": 49.72, + "confidence": 0.991 + }, + { + "text": "le", + "start": 49.72, + "end": 49.82, + "confidence": 0.993 + }, + { + "text": 
"fait", + "start": 49.82, + "end": 49.98, + "confidence": 0.999 + }, + { + "text": "que", + "start": 49.98, + "end": 50.14, + "confidence": 0.991 + }, + { + "text": "cet", + "start": 50.14, + "end": 50.32, + "confidence": 0.991 + }, + { + "text": "objet", + "start": 50.32, + "end": 50.66, + "confidence": 0.997 + }, + { + "text": "soit", + "start": 50.66, + "end": 51.12, + "confidence": 0.995 + }, + { + "text": "inédit", + "start": 51.12, + "end": 51.8, + "confidence": 0.995 + }, + { + "text": "induit", + "start": 51.8, + "end": 52.32, + "confidence": 0.976 + }, + { + "text": "que", + "start": 52.32, + "end": 52.42, + "confidence": 0.983 + }, + { + "text": "notre", + "start": 52.42, + "end": 52.72, + "confidence": 0.996 + }, + { + "text": "rapport", + "start": 52.72, + "end": 53.28, + "confidence": 0.997 + }, + { + "text": "à", + "start": 53.28, + "end": 53.44, + "confidence": 0.978 + }, + { + "text": "lui", + "start": 53.44, + "end": 53.66, + "confidence": 0.999 + }, + { + "text": "est", + "start": 53.66, + "end": 54.02, + "confidence": 0.915 + }, + { + "text": "aussi", + "start": 54.02, + "end": 54.54, + "confidence": 0.995 + }, + { + "text": "un", + "start": 54.54, + "end": 54.7, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 54.7, + "end": 55.0, + "confidence": 0.996 + }, + { + "text": "inédit?", + "start": 55.0, + "end": 55.46, + "confidence": 0.996 + } + ] + }, + { + "id": 12, + "seek": 4884, + "start": 55.46, + "end": 63.12, + "text": " Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone?", + "tokens": [ + 2588, + 16389, + 1264, + 11, + 871, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 13307, + 871, + 25323, + 1531, + 22829, + 421, + 6, + 266, + 3962, + 1147, + 1001, + 1531, + 274, + 6, + 16752, + 1111, + 25349, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506 + ], + "temperature": 0.0, + 
"avg_logprob": -0.10683460109281225, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.2805365258827806e-05, + "confidence": 0.965, + "words": [ + { + "text": "Je", + "start": 55.46, + "end": 55.9, + "confidence": 0.879 + }, + { + "text": "veux", + "start": 55.9, + "end": 56.0, + "confidence": 0.988 + }, + { + "text": "dire,", + "start": 56.0, + "end": 56.24, + "confidence": 0.997 + }, + { + "text": "est-ce", + "start": 56.24, + "end": 56.36, + "confidence": 0.99 + }, + { + "text": "que", + "start": 56.36, + "end": 56.42, + "confidence": 0.99 + }, + { + "text": "le", + "start": 56.42, + "end": 56.58, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 56.58, + "end": 56.88, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 56.88, + "end": 57.04, + "confidence": 0.985 + }, + { + "text": "a", + "start": 57.04, + "end": 57.18, + "confidence": 0.989 + }, + { + "text": "au", + "start": 57.18, + "end": 57.28, + "confidence": 0.967 + }, + { + "text": "smartphone", + "start": 57.28, + "end": 57.6, + "confidence": 0.994 + }, + { + "text": "est", + "start": 57.6, + "end": 57.92, + "confidence": 0.949 + }, + { + "text": "comparable", + "start": 57.92, + "end": 58.24, + "confidence": 0.997 + }, + { + "text": "à", + "start": 58.24, + "end": 58.48, + "confidence": 0.95 + }, + { + "text": "celui", + "start": 58.48, + "end": 58.66, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 58.66, + "end": 58.9, + "confidence": 0.989 + }, + { + "text": "entretenait", + "start": 58.9, + "end": 59.32, + "confidence": 0.929 + }, + { + "text": "à", + "start": 59.32, + "end": 59.46, + "confidence": 0.959 + }, + { + "text": "d'autres", + "start": 59.46, + "end": 59.7, + "confidence": 0.997 + }, + { + "text": "objets", + "start": 59.7, + "end": 59.96, + "confidence": 0.991 + }, + { + "text": "techniques", + "start": 59.96, + "end": 60.46, + "confidence": 0.983 + }, + { + "text": "comme", + "start": 60.46, + "end": 60.88, + "confidence": 0.586 + }, + { 
+ "text": "la", + "start": 60.88, + "end": 61.5, + "confidence": 0.987 + }, + { + "text": "voiture", + "start": 61.5, + "end": 62.06, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 62.06, + "end": 62.36, + "confidence": 0.946 + }, + { + "text": "le", + "start": 62.36, + "end": 62.68, + "confidence": 0.998 + }, + { + "text": "téléphone?", + "start": 62.68, + "end": 63.12, + "confidence": 0.999 + } + ] + }, + { + "id": 13, + "seek": 4884, + "start": 63.36, + "end": 66.66, + "text": " Il n'y a pas d'équivalent en fait.", + "tokens": [ + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 465, + 3887, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10683460109281225, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.2805365258827806e-05, + "confidence": 0.936, + "words": [ + { + "text": "Il", + "start": 63.36, + "end": 65.42, + "confidence": 0.778 + }, + { + "text": "n'y", + "start": 65.42, + "end": 65.48, + "confidence": 0.978 + }, + { + "text": "a", + "start": 65.48, + "end": 65.54, + "confidence": 0.992 + }, + { + "text": "pas", + "start": 65.54, + "end": 65.66, + "confidence": 0.999 + }, + { + "text": "d'équivalent", + "start": 65.66, + "end": 66.22, + "confidence": 0.995 + }, + { + "text": "en", + "start": 66.22, + "end": 66.42, + "confidence": 0.601 + }, + { + "text": "fait.", + "start": 66.42, + "end": 66.66, + "confidence": 0.996 + } + ] + }, + { + "id": 14, + "seek": 4884, + "start": 66.88, + "end": 71.52, + "text": " Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant.", + "tokens": [ + 3790, + 5926, + 5550, + 7089, + 30236, + 368, + 11456, + 1375, + 526, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 11, + 269, + 6, + 377, + 7184, + 259, + 394, + 1030, + 7245, + 351, + 5798, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10683460109281225, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.2805365258827806e-05, + "confidence": 0.953, + 
"words": [ + { + "text": "Et", + "start": 66.88, + "end": 66.98, + "confidence": 0.599 + }, + { + "text": "donc", + "start": 66.98, + "end": 67.08, + "confidence": 0.902 + }, + { + "text": "cette", + "start": 67.08, + "end": 67.28, + "confidence": 0.712 + }, + { + "text": "espèce", + "start": 67.28, + "end": 67.54, + "confidence": 0.996 + }, + { + "text": "de", + "start": 67.54, + "end": 67.68, + "confidence": 0.999 + }, + { + "text": "nouveauté", + "start": 67.68, + "end": 68.48, + "confidence": 0.979 + }, + { + "text": "dans", + "start": 68.48, + "end": 68.66, + "confidence": 0.98 + }, + { + "text": "la", + "start": 68.66, + "end": 68.94, + "confidence": 0.995 + }, + { + "text": "relation", + "start": 68.94, + "end": 69.22, + "confidence": 0.998 + }, + { + "text": "à", + "start": 69.22, + "end": 69.38, + "confidence": 0.997 + }, + { + "text": "l'objet,", + "start": 69.38, + "end": 70.24, + "confidence": 0.997 + }, + { + "text": "c'est", + "start": 70.24, + "end": 70.38, + "confidence": 0.98 + }, + { + "text": "fascinant", + "start": 70.38, + "end": 70.64, + "confidence": 0.978 + }, + { + "text": "et", + "start": 70.64, + "end": 70.76, + "confidence": 0.965 + }, + { + "text": "terrifiant.", + "start": 70.76, + "end": 71.52, + "confidence": 0.977 + } + ] + }, + { + "id": 15, + "seek": 4884, + "start": 71.62, + "end": 76.48, + "text": " Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendants de cet objet,", + "tokens": [ + 20429, + 421, + 6, + 266, + 257, + 287, + 6, + 36107, + 11, + 5173, + 476, + 37313, + 1512, + 33643, + 25929, + 1030, + 1512, + 3328, + 11, + 274, + 6, + 9498, + 45768, + 1719, + 368, + 8603, + 14964, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.10683460109281225, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.2805365258827806e-05, + "confidence": 0.815, + "words": [ + { + "text": "Parce", + "start": 71.62, + "end": 71.86, + "confidence": 0.514 + }, + { + "text": "qu'on", + "start": 
71.86, + "end": 72.12, + "confidence": 0.938 + }, + { + "text": "a", + "start": 72.12, + "end": 72.44, + "confidence": 0.982 + }, + { + "text": "l'impression,", + "start": 72.44, + "end": 73.56, + "confidence": 0.998 + }, + { + "text": "comme", + "start": 73.56, + "end": 73.84, + "confidence": 0.964 + }, + { + "text": "le", + "start": 73.84, + "end": 74.0, + "confidence": 0.984 + }, + { + "text": "disent", + "start": 74.0, + "end": 74.2, + "confidence": 0.998 + }, + { + "text": "les", + "start": 74.2, + "end": 74.4, + "confidence": 0.994 + }, + { + "text": "utilisateurs", + "start": 74.4, + "end": 74.84, + "confidence": 0.997 + }, + { + "text": "et", + "start": 74.84, + "end": 74.96, + "confidence": 0.331 + }, + { + "text": "les", + "start": 74.96, + "end": 75.0, + "confidence": 0.775 + }, + { + "text": "services,", + "start": 75.0, + "end": 75.22, + "confidence": 0.217 + }, + { + "text": "d'être", + "start": 75.22, + "end": 75.42, + "confidence": 0.768 + }, + { + "text": "dépendants", + "start": 75.42, + "end": 75.96, + "confidence": 0.79 + }, + { + "text": "de", + "start": 75.96, + "end": 76.08, + "confidence": 0.985 + }, + { + "text": "cet", + "start": 76.08, + "end": 76.26, + "confidence": 0.996 + }, + { + "text": "objet,", + "start": 76.26, + "end": 76.48, + "confidence": 0.996 + } + ] + }, + { + "id": 16, + "seek": 7684, + "start": 76.86, + "end": 83.26, + "text": " d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet.", + "tokens": [ + 274, + 6, + 471, + 43612, + 465, + 3887, + 2251, + 7089, + 30236, + 368, + 9721, + 11, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 368, + 287, + 6, + 335, + 781, + 374, + 1030, + 1956, + 669, + 18832, + 6212, + 1531, + 730, + 1254, + 279, + 368, + 319, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06925634075613583, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.771887572336709e-06, + 
"confidence": 0.917, + "words": [ + { + "text": "d'induire", + "start": 76.86, + "end": 77.08, + "confidence": 0.84 + }, + { + "text": "en", + "start": 77.08, + "end": 77.24, + "confidence": 0.617 + }, + { + "text": "fait", + "start": 77.24, + "end": 77.34, + "confidence": 0.994 + }, + { + "text": "une", + "start": 77.34, + "end": 77.52, + "confidence": 0.983 + }, + { + "text": "espèce", + "start": 77.52, + "end": 77.88, + "confidence": 0.996 + }, + { + "text": "de", + "start": 77.88, + "end": 78.48, + "confidence": 0.997 + }, + { + "text": "relation,", + "start": 78.48, + "end": 78.6, + "confidence": 0.601 + }, + { + "text": "de", + "start": 78.6, + "end": 78.94, + "confidence": 0.987 + }, + { + "text": "médiation", + "start": 78.94, + "end": 79.52, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 79.52, + "end": 79.74, + "confidence": 0.967 + }, + { + "text": "le", + "start": 79.74, + "end": 79.92, + "confidence": 0.998 + }, + { + "text": "monde", + "start": 79.92, + "end": 80.64, + "confidence": 0.992 + }, + { + "text": "qui", + "start": 80.64, + "end": 81.1, + "confidence": 0.695 + }, + { + "text": "rend", + "start": 81.1, + "end": 81.64, + "confidence": 0.907 + }, + { + "text": "de", + "start": 81.64, + "end": 81.78, + "confidence": 0.714 + }, + { + "text": "l'ampleur", + "start": 81.78, + "end": 82.02, + "confidence": 0.987 + }, + { + "text": "et", + "start": 82.02, + "end": 82.12, + "confidence": 0.931 + }, + { + "text": "qui", + "start": 82.12, + "end": 82.24, + "confidence": 0.976 + }, + { + "text": "amène", + "start": 82.24, + "end": 82.36, + "confidence": 0.973 + }, + { + "text": "aussi", + "start": 82.36, + "end": 82.56, + "confidence": 0.939 + }, + { + "text": "à", + "start": 82.56, + "end": 82.64, + "confidence": 0.941 + }, + { + "text": "des", + "start": 82.64, + "end": 82.72, + "confidence": 0.992 + }, + { + "text": "formes", + "start": 82.72, + "end": 82.9, + "confidence": 0.993 + }, + { + "text": "de", + "start": 82.9, + "end": 83.02, + 
"confidence": 0.997 + }, + { + "text": "rejet.", + "start": 83.02, + "end": 83.26, + "confidence": 0.884 + } + ] + }, + { + "id": 17, + "seek": 7684, + "start": 83.94, + "end": 87.8, + "text": " Donc, à objet inédit, rapport inédit.", + "tokens": [ + 7477, + 11, + 1531, + 14964, + 294, + 7811, + 270, + 11, + 18018, + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06925634075613583, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.771887572336709e-06, + "confidence": 0.962, + "words": [ + { + "text": "Donc,", + "start": 83.94, + "end": 84.94, + "confidence": 0.971 + }, + { + "text": "à", + "start": 84.94, + "end": 84.98, + "confidence": 0.881 + }, + { + "text": "objet", + "start": 84.98, + "end": 85.36, + "confidence": 0.827 + }, + { + "text": "inédit,", + "start": 85.36, + "end": 86.56, + "confidence": 0.993 + }, + { + "text": "rapport", + "start": 86.56, + "end": 87.0, + "confidence": 0.981 + }, + { + "text": "inédit.", + "start": 87.0, + "end": 87.8, + "confidence": 0.998 + } + ] + }, + { + "id": 18, + "seek": 7684, + "start": 88.02, + "end": 95.14, + "text": " Et ce rapport, si j'en crois Nicolas, serait caractérisé par un mélange de dépendance et de rejet.", + "tokens": [ + 3790, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 21724, + 38268, + 11, + 23139, + 1032, + 578, + 4198, + 22118, + 971, + 517, + 41953, + 933, + 368, + 45768, + 719, + 1030, + 368, + 319, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06925634075613583, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.771887572336709e-06, + "confidence": 0.972, + "words": [ + { + "text": "Et", + "start": 88.02, + "end": 88.48, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 88.48, + "end": 88.86, + "confidence": 0.975 + }, + { + "text": "rapport,", + "start": 88.86, + "end": 89.28, + "confidence": 0.998 + }, + { + "text": "si", + "start": 89.28, + "end": 89.56, + "confidence": 0.999 + }, + { + "text": "j'en", + "start": 
89.56, + "end": 89.84, + "confidence": 0.996 + }, + { + "text": "crois", + "start": 89.84, + "end": 89.88, + "confidence": 0.984 + }, + { + "text": "Nicolas,", + "start": 89.88, + "end": 90.54, + "confidence": 0.683 + }, + { + "text": "serait", + "start": 90.54, + "end": 90.94, + "confidence": 0.887 + }, + { + "text": "caractérisé", + "start": 90.94, + "end": 91.8, + "confidence": 0.993 + }, + { + "text": "par", + "start": 91.8, + "end": 92.12, + "confidence": 0.997 + }, + { + "text": "un", + "start": 92.12, + "end": 92.44, + "confidence": 0.997 + }, + { + "text": "mélange", + "start": 92.44, + "end": 92.98, + "confidence": 0.999 + }, + { + "text": "de", + "start": 92.98, + "end": 93.4, + "confidence": 0.998 + }, + { + "text": "dépendance", + "start": 93.4, + "end": 94.24, + "confidence": 0.952 + }, + { + "text": "et", + "start": 94.24, + "end": 94.54, + "confidence": 0.998 + }, + { + "text": "de", + "start": 94.54, + "end": 94.68, + "confidence": 0.999 + }, + { + "text": "rejet.", + "start": 94.68, + "end": 95.14, + "confidence": 0.993 + } + ] + }, + { + "id": 19, + "seek": 7684, + "start": 95.78, + "end": 102.86, + "text": " Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies", + "tokens": [ + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 5732, + 962, + 1712, + 14953, + 287, + 6, + 29093, + 730, + 1111, + 25349, + 7512, + 1030, + 368, + 9580, + 8969, + 313, + 2680, + 3269, + 371, + 530 + ], + "temperature": 0.0, + "avg_logprob": -0.06925634075613583, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.771887572336709e-06, + "confidence": 0.941, + "words": [ + { + "text": "Bon,", + "start": 95.78, + "end": 96.38, + "confidence": 0.793 + }, + { + "text": "en", + "start": 96.38, + "end": 96.52, + "confidence": 0.998 + }, + { + "text": "vrai,", + "start": 96.52, + "end": 97.14, + "confidence": 0.994 + }, + { + "text": "il", + "start": 97.14, 
+ "end": 97.18, + "confidence": 0.998 + }, + { + "text": "faudrait", + "start": 97.18, + "end": 97.58, + "confidence": 0.997 + }, + { + "text": "remonter", + "start": 97.58, + "end": 98.08, + "confidence": 0.997 + }, + { + "text": "très", + "start": 98.08, + "end": 98.58, + "confidence": 0.997 + }, + { + "text": "très", + "start": 98.58, + "end": 98.7, + "confidence": 0.767 + }, + { + "text": "finement", + "start": 98.7, + "end": 99.32, + "confidence": 0.849 + }, + { + "text": "toute", + "start": 99.32, + "end": 99.7, + "confidence": 0.984 + }, + { + "text": "l'histoire", + "start": 99.7, + "end": 100.06, + "confidence": 0.997 + }, + { + "text": "des", + "start": 100.06, + "end": 100.24, + "confidence": 0.998 + }, + { + "text": "objets", + "start": 100.24, + "end": 100.48, + "confidence": 0.999 + }, + { + "text": "techniques", + "start": 100.48, + "end": 101.02, + "confidence": 0.984 + }, + { + "text": "et", + "start": 101.02, + "end": 101.48, + "confidence": 0.531 + }, + { + "text": "de", + "start": 101.48, + "end": 101.68, + "confidence": 0.994 + }, + { + "text": "leur", + "start": 101.68, + "end": 101.84, + "confidence": 0.829 + }, + { + "text": "insertion", + "start": 101.84, + "end": 102.32, + "confidence": 0.994 + }, + { + "text": "dans", + "start": 102.32, + "end": 102.48, + "confidence": 0.991 + }, + { + "text": "nos", + "start": 102.48, + "end": 102.66, + "confidence": 0.998 + }, + { + "text": "vies", + "start": 102.66, + "end": 102.86, + "confidence": 0.998 + } + ] + }, + { + "id": 20, + "seek": 7684, + "start": 102.9, + "end": 105.74, + "text": " pour déterminer si ce rapport est totalement inédit.", + "tokens": [ + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203, + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06925634075613583, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.771887572336709e-06, + "confidence": 0.981, + "words": [ + { + "text": "pour", + "start": 102.9, + "end": 103.06, + 
"confidence": 0.819 + }, + { + "text": "déterminer", + "start": 103.06, + "end": 103.66, + "confidence": 0.997 + }, + { + "text": "si", + "start": 103.66, + "end": 103.76, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 103.76, + "end": 103.94, + "confidence": 0.997 + }, + { + "text": "rapport", + "start": 103.94, + "end": 104.26, + "confidence": 0.997 + }, + { + "text": "est", + "start": 104.26, + "end": 104.74, + "confidence": 0.998 + }, + { + "text": "totalement", + "start": 104.74, + "end": 105.3, + "confidence": 0.999 + }, + { + "text": "inédit.", + "start": 105.3, + "end": 105.74, + "confidence": 0.999 + } + ] + }, + { + "id": 21, + "seek": 10584, + "start": 106.1, + "end": 109.34, + "text": " Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment.", + "tokens": [ + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 408, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07393737035254909, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.3074043535161763e-05, + "confidence": 0.94, + "words": [ + { + "text": "Mais", + "start": 106.1, + "end": 106.36, + "confidence": 0.947 + }, + { + "text": "j'ai", + "start": 106.36, + "end": 106.92, + "confidence": 0.94 + }, + { + "text": "l'impression", + "start": 106.92, + "end": 107.36, + "confidence": 0.996 + }, + { + "text": "comme", + "start": 107.36, + "end": 107.56, + "confidence": 0.642 + }, + { + "text": "ça", + "start": 107.56, + "end": 107.82, + "confidence": 0.978 + }, + { + "text": "que", + "start": 107.82, + "end": 107.96, + "confidence": 0.976 + }, + { + "text": "Nicolas", + "start": 107.96, + "end": 108.46, + "confidence": 0.985 + }, + { + "text": "ne", + "start": 108.46, + "end": 108.66, + "confidence": 0.726 + }, + { + "text": "se", + "start": 108.66, + "end": 108.7, + "confidence": 0.991 + }, + { + "text": "trompe", + "start": 108.7, + "end": 108.88, + "confidence": 0.995 + }, + { + "text": 
"pas", + "start": 108.88, + "end": 109.08, + "confidence": 0.999 + }, + { + "text": "vraiment.", + "start": 109.08, + "end": 109.34, + "confidence": 0.991 + } + ] + }, + { + "id": 22, + "seek": 10584, + "start": 109.88, + "end": 114.98, + "text": " Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone.", + "tokens": [ + 8732, + 34081, + 631, + 1506, + 262, + 6000, + 11, + 1930, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698, + 1581, + 47159, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07393737035254909, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.3074043535161763e-05, + "confidence": 0.969, + "words": [ + { + "text": "Pour", + "start": 109.88, + "end": 110.08, + "confidence": 0.997 + }, + { + "text": "autant", + "start": 110.08, + "end": 110.24, + "confidence": 1.0 + }, + { + "text": "que", + "start": 110.24, + "end": 110.42, + "confidence": 0.988 + }, + { + "text": "je", + "start": 110.42, + "end": 110.52, + "confidence": 0.998 + }, + { + "text": "sache,", + "start": 110.52, + "end": 111.14, + "confidence": 0.962 + }, + { + "text": "il", + "start": 111.14, + "end": 111.18, + "confidence": 0.997 + }, + { + "text": "y", + "start": 111.18, + "end": 111.32, + "confidence": 0.992 + }, + { + "text": "a", + "start": 111.32, + "end": 111.36, + "confidence": 0.993 + }, + { + "text": "eu", + "start": 111.36, + "end": 111.68, + "confidence": 0.998 + }, + { + "text": "plein", + "start": 111.68, + "end": 111.88, + "confidence": 0.974 + }, + { + "text": "de", + "start": 111.88, + "end": 112.06, + "confidence": 0.997 + }, + { + "text": "discussions", + "start": 112.06, + "end": 112.6, + "confidence": 0.799 + }, + { + "text": "autour", + "start": 112.6, + "end": 112.94, + "confidence": 0.995 + }, + { + "text": "de", + "start": 112.94, + "end": 113.46, + "confidence": 0.997 + }, + { + "text": "la", + "start": 113.46, + "end": 113.52, + "confidence": 0.998 + }, + 
{ + "text": "voiture", + "start": 113.52, + "end": 113.86, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 113.86, + "end": 114.06, + "confidence": 0.765 + }, + { + "text": "même", + "start": 114.06, + "end": 114.44, + "confidence": 0.996 + }, + { + "text": "du", + "start": 114.44, + "end": 114.6, + "confidence": 0.995 + }, + { + "text": "téléphone.", + "start": 114.6, + "end": 114.98, + "confidence": 0.999 + } + ] + }, + { + "id": 23, + "seek": 10584, + "start": 115.34, + "end": 119.84, + "text": " Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre.", + "tokens": [ + 6313, + 635, + 45768, + 719, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13, + 7477, + 476, + 319, + 7108, + 2107, + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07393737035254909, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.3074043535161763e-05, + "confidence": 0.972, + "words": [ + { + "text": "Mais", + "start": 115.34, + "end": 115.72, + "confidence": 0.994 + }, + { + "text": "la", + "start": 115.72, + "end": 116.02, + "confidence": 0.936 + }, + { + "text": "dépendance", + "start": 116.02, + "end": 116.4, + "confidence": 0.997 + }, + { + "text": "n'était", + "start": 116.4, + "end": 116.62, + "confidence": 0.994 + }, + { + "text": "pas", + "start": 116.62, + "end": 117.0, + "confidence": 0.998 + }, + { + "text": "du", + "start": 117.0, + "end": 117.16, + "confidence": 0.995 + }, + { + "text": "même", + "start": 117.16, + "end": 117.46, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 117.46, + "end": 117.78, + "confidence": 0.999 + }, + { + "text": "Donc", + "start": 117.78, + "end": 117.98, + "confidence": 0.806 + }, + { + "text": "le", + "start": 117.98, + "end": 118.34, + "confidence": 0.709 + }, + { + "text": "rejet", + "start": 118.34, + "end": 118.62, + "confidence": 0.999 + }, + { + "text": "non", + "start": 118.62, + 
"end": 118.78, + "confidence": 0.974 + }, + { + "text": "plus", + "start": 118.78, + "end": 118.94, + "confidence": 0.995 + }, + { + "text": "n'était", + "start": 118.94, + "end": 119.12, + "confidence": 0.987 + }, + { + "text": "pas", + "start": 119.12, + "end": 119.3, + "confidence": 0.998 + }, + { + "text": "du", + "start": 119.3, + "end": 119.38, + "confidence": 0.995 + }, + { + "text": "même", + "start": 119.38, + "end": 119.56, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 119.56, + "end": 119.84, + "confidence": 0.999 + } + ] + }, + { + "id": 24, + "seek": 10584, + "start": 119.98, + "end": 123.02, + "text": " On peut adorer sa bagnole, en avoir besoin pour plein de choses.", + "tokens": [ + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 1771, + 306, + 11, + 465, + 10853, + 19207, + 2016, + 21088, + 368, + 14488, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07393737035254909, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.3074043535161763e-05, + "confidence": 0.991, + "words": [ + { + "text": "On", + "start": 119.98, + "end": 120.18, + "confidence": 0.996 + }, + { + "text": "peut", + "start": 120.18, + "end": 120.38, + "confidence": 0.997 + }, + { + "text": "adorer", + "start": 120.38, + "end": 120.66, + "confidence": 0.99 + }, + { + "text": "sa", + "start": 120.66, + "end": 120.88, + "confidence": 0.985 + }, + { + "text": "bagnole,", + "start": 120.88, + "end": 121.46, + "confidence": 0.984 + }, + { + "text": "en", + "start": 121.46, + "end": 121.56, + "confidence": 0.989 + }, + { + "text": "avoir", + "start": 121.56, + "end": 121.74, + "confidence": 0.998 + }, + { + "text": "besoin", + "start": 121.74, + "end": 122.1, + "confidence": 0.999 + }, + { + "text": "pour", + "start": 122.1, + "end": 122.34, + "confidence": 0.987 + }, + { + "text": "plein", + "start": 122.34, + "end": 122.68, + "confidence": 0.989 + }, + { + "text": "de", + "start": 122.68, + "end": 122.8, + "confidence": 0.998 + }, + { + "text": "choses.", 
+ "start": 122.8, + "end": 123.02, + "confidence": 0.989 + } + ] + }, + { + "id": 25, + "seek": 10584, + "start": 123.28, + "end": 126.36, + "text": " Et bien, le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 3790, + 3610, + 11, + 476, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07393737035254909, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.3074043535161763e-05, + "confidence": 0.895, + "words": [ + { + "text": "Et", + "start": 123.28, + "end": 123.46, + "confidence": 0.666 + }, + { + "text": "bien,", + "start": 123.46, + "end": 123.86, + "confidence": 0.47 + }, + { + "text": "le", + "start": 123.86, + "end": 123.98, + "confidence": 0.996 + }, + { + "text": "soir,", + "start": 123.98, + "end": 124.68, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 124.68, + "end": 124.9, + "confidence": 0.997 + }, + { + "text": "on", + "start": 124.9, + "end": 125.02, + "confidence": 0.998 + }, + { + "text": "va", + "start": 125.02, + "end": 125.14, + "confidence": 0.996 + }, + { + "text": "se", + "start": 125.14, + "end": 125.38, + "confidence": 0.988 + }, + { + "text": "coucher,", + "start": 125.38, + "end": 125.8, + "confidence": 0.987 + }, + { + "text": "on", + "start": 125.8, + "end": 126.02, + "confidence": 0.995 + }, + { + "text": "la", + "start": 126.02, + "end": 126.22, + "confidence": 0.801 + }, + { + "text": "laisse.", + "start": 126.22, + "end": 126.36, + "confidence": 0.999 + } + ] + }, + { + "id": 26, + "seek": 10584, + "start": 126.98, + "end": 130.48, + "text": " On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes.", + "tokens": [ + 1282, + 408, + 287, + 6, + 64, + 1736, + 2680, + 635, + 2135, + 6932, + 322, + 871, + 1609, + 7997, + 11, + 322, + 408, + 287, + 6, + 443, + 76, + 18832, + 1736, + 1609, + 13228, + 1521, + 279, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07393737035254909, + 
"compression_ratio": 1.685512367491166, + "no_speech_prob": 5.3074043535161763e-05, + "confidence": 0.914, + "words": [ + { + "text": "On", + "start": 126.98, + "end": 127.32, + "confidence": 0.954 + }, + { + "text": "ne", + "start": 127.32, + "end": 127.36, + "confidence": 0.802 + }, + { + "text": "l'a", + "start": 127.36, + "end": 127.48, + "confidence": 0.974 + }, + { + "text": "pas", + "start": 127.48, + "end": 127.68, + "confidence": 0.999 + }, + { + "text": "dans", + "start": 127.68, + "end": 127.8, + "confidence": 0.996 + }, + { + "text": "la", + "start": 127.8, + "end": 128.06, + "confidence": 0.994 + }, + { + "text": "main", + "start": 128.06, + "end": 128.26, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 128.26, + "end": 128.44, + "confidence": 0.934 + }, + { + "text": "on", + "start": 128.44, + "end": 128.62, + "confidence": 0.997 + }, + { + "text": "est", + "start": 128.62, + "end": 128.68, + "confidence": 0.993 + }, + { + "text": "au", + "start": 128.68, + "end": 129.04, + "confidence": 0.984 + }, + { + "text": "lit,", + "start": 129.04, + "end": 129.14, + "confidence": 0.999 + }, + { + "text": "on", + "start": 129.14, + "end": 129.26, + "confidence": 0.427 + }, + { + "text": "ne", + "start": 129.26, + "end": 129.3, + "confidence": 0.963 + }, + { + "text": "l'emmène", + "start": 129.3, + "end": 129.5, + "confidence": 0.992 + }, + { + "text": "pas", + "start": 129.5, + "end": 129.68, + "confidence": 0.997 + }, + { + "text": "au", + "start": 129.68, + "end": 129.86, + "confidence": 0.668 + }, + { + "text": "chiottes.", + "start": 129.86, + "end": 130.48, + "confidence": 0.829 + } + ] + }, + { + "id": 27, + "seek": 13084, + "start": 130.86, + "end": 136.9, + "text": " On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain.", + "tokens": [ + 1282, + 45913, + 7418, + 45045, + 15797, + 971, + 1872, + 275, + 2851, + 1398, + 1956, + 8073, + 1001, + 635, + 34207, + 368, + 
47159, + 17338, + 2251, + 30027, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06175626696962299, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.5689402061980218e-05, + "confidence": 0.955, + "words": [ + { + "text": "On", + "start": 130.86, + "end": 131.04, + "confidence": 0.983 + }, + { + "text": "pouvait", + "start": 131.04, + "end": 131.28, + "confidence": 0.989 + }, + { + "text": "être", + "start": 131.28, + "end": 131.48, + "confidence": 0.996 + }, + { + "text": "énervé", + "start": 131.48, + "end": 132.22, + "confidence": 0.906 + }, + { + "text": "par", + "start": 132.22, + "end": 132.44, + "confidence": 0.991 + }, + { + "text": "son", + "start": 132.44, + "end": 132.7, + "confidence": 0.998 + }, + { + "text": "môme", + "start": 132.7, + "end": 133.1, + "confidence": 0.832 + }, + { + "text": "qui", + "start": 133.1, + "end": 133.34, + "confidence": 0.919 + }, + { + "text": "occupait", + "start": 133.34, + "end": 133.76, + "confidence": 0.991 + }, + { + "text": "la", + "start": 133.76, + "end": 133.8, + "confidence": 0.992 + }, + { + "text": "ligne", + "start": 133.8, + "end": 134.08, + "confidence": 0.999 + }, + { + "text": "de", + "start": 134.08, + "end": 134.14, + "confidence": 0.997 + }, + { + "text": "téléphone", + "start": 134.14, + "end": 134.6, + "confidence": 0.985 + }, + { + "text": "pendant", + "start": 134.6, + "end": 134.82, + "confidence": 0.98 + }, + { + "text": "une", + "start": 134.82, + "end": 135.2, + "confidence": 0.87 + }, + { + "text": "heure", + "start": 135.2, + "end": 135.36, + "confidence": 0.998 + }, + { + "text": "chaque", + "start": 135.36, + "end": 135.54, + "confidence": 0.991 + }, + { + "text": "soir", + "start": 135.54, + "end": 135.8, + "confidence": 0.996 + }, + { + "text": "pour", + "start": 135.8, + "end": 135.96, + "confidence": 0.791 + }, + { + "text": "discuter", + "start": 135.96, + "end": 136.28, + "confidence": 0.997 + 
}, + { + "text": "avec", + "start": 136.28, + "end": 136.48, + "confidence": 0.996 + }, + { + "text": "un", + "start": 136.48, + "end": 136.6, + "confidence": 0.999 + }, + { + "text": "copain.", + "start": 136.6, + "end": 136.9, + "confidence": 0.998 + } + ] + }, + { + "id": 28, + "seek": 13084, + "start": 137.28, + "end": 141.88, + "text": " Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui,", + "tokens": [ + 6313, + 2788, + 408, + 725, + 15750, + 35235, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 1769, + 5698, + 275, + 2851, + 1398, + 14023, + 6, + 10556, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.06175626696962299, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.5689402061980218e-05, + "confidence": 0.958, + "words": [ + { + "text": "Mais", + "start": 137.28, + "end": 137.46, + "confidence": 0.993 + }, + { + "text": "ça", + "start": 137.46, + "end": 137.68, + "confidence": 0.938 + }, + { + "text": "ne", + "start": 137.68, + "end": 137.94, + "confidence": 0.998 + }, + { + "text": "ressemblait", + "start": 137.94, + "end": 138.4, + "confidence": 0.991 + }, + { + "text": "pas", + "start": 138.4, + "end": 138.76, + "confidence": 0.995 + }, + { + "text": "à", + "start": 138.76, + "end": 138.94, + "confidence": 0.988 + }, + { + "text": "ce", + "start": 138.94, + "end": 138.98, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 138.98, + "end": 139.1, + "confidence": 0.986 + }, + { + "text": "peut", + "start": 139.1, + "end": 139.48, + "confidence": 0.988 + }, + { + "text": "ressentir", + "start": 139.48, + "end": 140.12, + "confidence": 0.997 + }, + { + "text": "à", + "start": 140.12, + "end": 140.32, + "confidence": 0.498 + }, + { + "text": "voir", + "start": 140.32, + "end": 140.46, + "confidence": 0.852 + }, + { + "text": "ce", + "start": 140.46, + "end": 140.68, + "confidence": 0.989 + }, + { + "text": "même", + "start": 140.68, + "end": 140.92, 
+ "confidence": 0.984 + }, + { + "text": "môme", + "start": 140.92, + "end": 141.34, + "confidence": 0.998 + }, + { + "text": "aujourd'hui,", + "start": 141.34, + "end": 141.88, + "confidence": 0.988 + } + ] + }, + { + "id": 29, + "seek": 13084, + "start": 142.14, + "end": 146.3, + "text": " continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe,", + "tokens": [ + 2354, + 285, + 1712, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 5173, + 1511, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 15165, + 49523, + 454, + 391, + 716, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.06175626696962299, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.5689402061980218e-05, + "confidence": 0.963, + "words": [ + { + "text": "continuellement", + "start": 142.14, + "end": 142.94, + "confidence": 0.971 + }, + { + "text": "avec", + "start": 142.94, + "end": 143.18, + "confidence": 0.806 + }, + { + "text": "son", + "start": 143.18, + "end": 143.38, + "confidence": 0.995 + }, + { + "text": "smartphone", + "start": 143.38, + "end": 143.76, + "confidence": 0.978 + }, + { + "text": "dans", + "start": 143.76, + "end": 143.94, + "confidence": 0.979 + }, + { + "text": "la", + "start": 143.94, + "end": 144.0, + "confidence": 0.996 + }, + { + "text": "main,", + "start": 144.0, + "end": 144.36, + "confidence": 0.998 + }, + { + "text": "comme", + "start": 144.36, + "end": 144.52, + "confidence": 0.836 + }, + { + "text": "si", + "start": 144.52, + "end": 144.64, + "confidence": 0.975 + }, + { + "text": "c'était", + "start": 144.64, + "end": 144.82, + "confidence": 0.991 + }, + { + "text": "une", + "start": 144.82, + "end": 145.06, + "confidence": 0.989 + }, + { + "text": "sorte", + "start": 145.06, + "end": 145.22, + "confidence": 0.997 + }, + { + "text": "de", + "start": 145.22, + "end": 145.3, + "confidence": 0.982 + }, + { + "text": "pacemaker", + "start": 145.3, + "end": 145.82, + "confidence": 0.917 + }, + { + "text": 
"externe,", + "start": 145.82, + "end": 146.3, + "confidence": 0.992 + } + ] + }, + { + "id": 30, + "seek": 13084, + "start": 146.34, + "end": 148.84, + "text": " comme si le lâcher allait entraîner sa mort immédiate.", + "tokens": [ + 5173, + 1511, + 476, + 48835, + 6759, + 439, + 1001, + 22284, + 7517, + 1193, + 601, + 6599, + 3397, + 526, + 4504, + 473, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06175626696962299, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.5689402061980218e-05, + "confidence": 0.989, + "words": [ + { + "text": "comme", + "start": 146.34, + "end": 146.58, + "confidence": 0.996 + }, + { + "text": "si", + "start": 146.58, + "end": 146.76, + "confidence": 0.994 + }, + { + "text": "le", + "start": 146.76, + "end": 146.86, + "confidence": 0.997 + }, + { + "text": "lâcher", + "start": 146.86, + "end": 147.36, + "confidence": 0.969 + }, + { + "text": "allait", + "start": 147.36, + "end": 147.56, + "confidence": 0.993 + }, + { + "text": "entraîner", + "start": 147.56, + "end": 147.86, + "confidence": 0.978 + }, + { + "text": "sa", + "start": 147.86, + "end": 148.0, + "confidence": 0.999 + }, + { + "text": "mort", + "start": 148.0, + "end": 148.22, + "confidence": 0.998 + }, + { + "text": "immédiate.", + "start": 148.22, + "end": 148.84, + "confidence": 0.997 + } + ] + }, + { + "id": 31, + "seek": 13084, + "start": 149.04, + "end": 151.96, + "text": " Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi.", + "tokens": [ + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 2851, + 1398, + 11, + 2420, + 269, + 6, + 377, + 24724, + 1323, + 712, + 2016, + 4666, + 6212, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06175626696962299, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.5689402061980218e-05, + "confidence": 0.974, + "words": [ + { + "text": "Bon,", + "start": 149.04, + "end": 149.28, + "confidence": 0.917 + }, + { + "text": "je", + "start": 149.28, + "end": 149.32, + 
"confidence": 0.935 + }, + { + "text": "dis", + "start": 149.32, + "end": 149.46, + "confidence": 0.988 + }, + { + "text": "ça", + "start": 149.46, + "end": 149.64, + "confidence": 0.994 + }, + { + "text": "pour", + "start": 149.64, + "end": 149.74, + "confidence": 0.997 + }, + { + "text": "le", + "start": 149.74, + "end": 149.88, + "confidence": 0.995 + }, + { + "text": "môme,", + "start": 149.88, + "end": 150.32, + "confidence": 0.998 + }, + { + "text": "mais", + "start": 150.32, + "end": 150.52, + "confidence": 0.793 + }, + { + "text": "c'est", + "start": 150.52, + "end": 150.82, + "confidence": 0.982 + }, + { + "text": "évidemment", + "start": 150.82, + "end": 151.14, + "confidence": 0.98 + }, + { + "text": "valable", + "start": 151.14, + "end": 151.48, + "confidence": 0.998 + }, + { + "text": "pour", + "start": 151.48, + "end": 151.62, + "confidence": 0.997 + }, + { + "text": "nous", + "start": 151.62, + "end": 151.76, + "confidence": 0.999 + }, + { + "text": "aussi.", + "start": 151.76, + "end": 151.96, + "confidence": 0.996 + } + ] + }, + { + "id": 32, + "seek": 13084, + "start": 152.34, + "end": 158.22, + "text": " Donc, rapport inédit. D'accord. 
Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais?", + "tokens": [ + 7477, + 11, + 18018, + 294, + 7811, + 270, + 13, + 413, + 6, + 19947, + 13, + 6313, + 19934, + 257, + 12, + 83, + 12, + 266, + 287, + 6, + 36107, + 421, + 6, + 266, + 297, + 6, + 268, + 1333, + 4271, + 14540, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.06175626696962299, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.5689402061980218e-05, + "confidence": 0.948, + "words": [ + { + "text": "Donc,", + "start": 152.34, + "end": 153.46, + "confidence": 0.991 + }, + { + "text": "rapport", + "start": 153.46, + "end": 153.66, + "confidence": 0.977 + }, + { + "text": "inédit.", + "start": 153.66, + "end": 154.24, + "confidence": 0.997 + }, + { + "text": "D'accord.", + "start": 154.24, + "end": 155.48, + "confidence": 0.979 + }, + { + "text": "Mais", + "start": 155.48, + "end": 155.82, + "confidence": 0.56 + }, + { + "text": "pourquoi", + "start": 155.82, + "end": 156.32, + "confidence": 0.994 + }, + { + "text": "a-t-on", + "start": 156.32, + "end": 156.68, + "confidence": 0.94 + }, + { + "text": "l'impression", + "start": 156.68, + "end": 157.06, + "confidence": 0.999 + }, + { + "text": "qu'on", + "start": 157.06, + "end": 157.26, + "confidence": 0.995 + }, + { + "text": "n'en", + "start": 157.26, + "end": 157.44, + "confidence": 0.878 + }, + { + "text": "sortira", + "start": 157.44, + "end": 157.9, + "confidence": 0.989 + }, + { + "text": "jamais?", + "start": 157.9, + "end": 158.22, + "confidence": 0.997 + } + ] + }, + { + "id": 33, + "seek": 15884, + "start": 158.86, + "end": 165.32, + "text": " Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux?", + "tokens": [ + 4410, + 12, + 384, + 421, + 6, + 388, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 8603, + 484, + 388, + 3551, + 303, + 3409, + 2449, + 1030, + 1026, + 
14923, + 1925, + 11, + 1030, + 1026, + 14923, + 1925, + 6992, + 631, + 3551, + 303, + 3409, + 2449, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.07952147990733653, + "compression_ratio": 1.6517857142857142, + "no_speech_prob": 5.475811485666782e-05, + "confidence": 0.962, + "words": [ + { + "text": "Est-ce", + "start": 158.86, + "end": 159.34, + "confidence": 0.981 + }, + { + "text": "qu'il", + "start": 159.34, + "end": 159.46, + "confidence": 0.997 + }, + { + "text": "faut", + "start": 159.46, + "end": 159.62, + "confidence": 0.999 + }, + { + "text": "en", + "start": 159.62, + "end": 159.78, + "confidence": 0.97 + }, + { + "text": "remettre", + "start": 159.78, + "end": 160.12, + "confidence": 0.999 + }, + { + "text": "la", + "start": 160.12, + "end": 160.34, + "confidence": 0.998 + }, + { + "text": "faute", + "start": 160.34, + "end": 160.66, + "confidence": 0.986 + }, + { + "text": "sur", + "start": 160.66, + "end": 160.94, + "confidence": 0.995 + }, + { + "text": "les", + "start": 160.94, + "end": 161.28, + "confidence": 0.995 + }, + { + "text": "gens", + "start": 161.28, + "end": 161.44, + "confidence": 1.0 + }, + { + "text": "qui", + "start": 161.44, + "end": 161.58, + "confidence": 0.984 + }, + { + "text": "ont", + "start": 161.58, + "end": 161.72, + "confidence": 0.998 + }, + { + "text": "créé", + "start": 161.72, + "end": 162.3, + "confidence": 0.99 + }, + { + "text": "cet", + "start": 162.3, + "end": 162.46, + "confidence": 0.852 + }, + { + "text": "outil", + "start": 162.46, + "end": 162.78, + "confidence": 0.99 + }, + { + "text": "merveilleux", + "start": 162.78, + "end": 163.34, + "confidence": 0.994 + }, + { + "text": "et", + "start": 163.34, + "end": 163.5, + "confidence": 0.954 + }, + { + "text": "diabolique,", + "start": 163.5, + "end": 163.86, + "confidence": 0.992 + }, + { + "text": "et", + "start": 163.86, + "end": 163.92, + "confidence": 0.539 + }, + { + "text": "diabolique", + "start": 163.92, + "end": 164.4, + "confidence": 0.951 + 
}, + { + "text": "parce", + "start": 164.4, + "end": 164.66, + "confidence": 0.704 + }, + { + "text": "que", + "start": 164.66, + "end": 164.84, + "confidence": 0.99 + }, + { + "text": "merveilleux?", + "start": 164.84, + "end": 165.32, + "confidence": 0.997 + } + ] + }, + { + "id": 34, + "seek": 15884, + "start": 166.34, + "end": 168.82, + "text": " Les économistes parlent de dépendance du sentier.", + "tokens": [ + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 2279, + 811, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07952147990733653, + "compression_ratio": 1.6517857142857142, + "no_speech_prob": 5.475811485666782e-05, + "confidence": 0.984, + "words": [ + { + "text": "Les", + "start": 166.34, + "end": 167.04, + "confidence": 0.925 + }, + { + "text": "économistes", + "start": 167.04, + "end": 167.48, + "confidence": 0.998 + }, + { + "text": "parlent", + "start": 167.48, + "end": 167.68, + "confidence": 0.995 + }, + { + "text": "de", + "start": 167.68, + "end": 167.82, + "confidence": 0.995 + }, + { + "text": "dépendance", + "start": 167.82, + "end": 168.36, + "confidence": 0.985 + }, + { + "text": "du", + "start": 168.36, + "end": 168.5, + "confidence": 0.997 + }, + { + "text": "sentier.", + "start": 168.5, + "end": 168.82, + "confidence": 0.978 + } + ] + }, + { + "id": 35, + "seek": 16884, + "start": 168.86, + "end": 177.42, + "text": " C'est l'idée qu'on est sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "tokens": [ + 50364, + 383, + 6, + 377, + 287, + 6, + 34281, + 421, + 6, + 266, + 871, + 1022, + 517, + 2279, + 811, + 1956, + 257, + 8862, + 4823, + 455, + 2081, + 11, + 12703, + 40005, + 9020, + 518, + 465, + 8368, + 394, + 30677, + 11, + 12703, + 465, + 40763, + 29492, + 730, + 4232, + 279, + 11, + 465, + 40763, + 29492, + 2251, + 6358, + 42379, + 13, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.10392295320828755, + 
"compression_ratio": 1.3916666666666666, + "no_speech_prob": 3.9441460103262216e-05, + "confidence": 0.93, + "words": [ + { + "text": "C'est", + "start": 168.86, + "end": 169.1, + "confidence": 0.952 + }, + { + "text": "l'idée", + "start": 169.1, + "end": 169.34, + "confidence": 0.992 + }, + { + "text": "qu'on", + "start": 169.34, + "end": 169.7, + "confidence": 0.824 + }, + { + "text": "est", + "start": 169.7, + "end": 169.88, + "confidence": 0.631 + }, + { + "text": "sur", + "start": 169.88, + "end": 170.0, + "confidence": 0.993 + }, + { + "text": "un", + "start": 170.0, + "end": 170.54, + "confidence": 0.998 + }, + { + "text": "sentier", + "start": 170.54, + "end": 170.78, + "confidence": 0.99 + }, + { + "text": "qui", + "start": 170.78, + "end": 170.84, + "confidence": 0.962 + }, + { + "text": "a", + "start": 170.84, + "end": 170.94, + "confidence": 0.98 + }, + { + "text": "été", + "start": 170.94, + "end": 171.12, + "confidence": 0.996 + }, + { + "text": "établi,", + "start": 171.12, + "end": 171.9, + "confidence": 0.995 + }, + { + "text": "soit", + "start": 171.9, + "end": 172.12, + "confidence": 0.988 + }, + { + "text": "volontairement", + "start": 172.12, + "end": 172.72, + "confidence": 0.965 + }, + { + "text": "en", + "start": 172.72, + "end": 172.8, + "confidence": 0.941 + }, + { + "text": "marchant", + "start": 172.8, + "end": 173.06, + "confidence": 0.997 + }, + { + "text": "dessus,", + "start": 173.06, + "end": 174.24, + "confidence": 0.972 + }, + { + "text": "soit", + "start": 174.24, + "end": 174.92, + "confidence": 0.996 + }, + { + "text": "en", + "start": 174.92, + "end": 175.36, + "confidence": 0.991 + }, + { + "text": "définissant", + "start": 175.36, + "end": 175.5, + "confidence": 0.983 + }, + { + "text": "des", + "start": 175.5, + "end": 175.76, + "confidence": 0.984 + }, + { + "text": "bornes,", + "start": 175.76, + "end": 176.04, + "confidence": 0.975 + }, + { + "text": "en", + "start": 176.04, + "end": 176.08, + "confidence": 0.683 + }, + 
{ + "text": "définissant", + "start": 176.08, + "end": 176.58, + "confidence": 0.997 + }, + { + "text": "une", + "start": 176.58, + "end": 176.82, + "confidence": 0.944 + }, + { + "text": "signalétique.", + "start": 176.82, + "end": 177.42, + "confidence": 0.643 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/data/words.wav b/tests/data/words.wav new file mode 100644 index 0000000000000000000000000000000000000000..62f594013e3f01d28b73172dfa013e1180ff2ba9 Binary files /dev/null and b/tests/data/words.wav differ diff --git a/tests/data/yes_punctuations.mp3.words.json b/tests/data/yes_punctuations.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..64ed44959c984ee2b8ee34cc27b8924b62bf0ee4 --- /dev/null +++ b/tests/data/yes_punctuations.mp3.words.json @@ -0,0 +1,68 @@ +{ + "text": " Dis-moi, est-ce que l'avion vole?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.4, + "end": 2.34, + "text": " Dis-moi, est-ce que l'avion vole?", + "tokens": [ + 50364, + 4208, + 12, + 29292, + 11, + 871, + 12, + 384, + 631, + 287, + 6, + 706, + 313, + 49877, + 2506, + 50494 + ], + "temperature": 0.0, + "avg_logprob": -0.3014036907869227, + "compression_ratio": 0.8048780487804879, + "no_speech_prob": 0.05134102329611778, + "confidence": 0.925, + "words": [ + { + "text": "Dis-moi,", + "start": 0.4, + "end": 1.36, + "confidence": 0.801 + }, + { + "text": "est-ce", + "start": 1.36, + "end": 1.52, + "confidence": 0.966 + }, + { + "text": "que", + "start": 1.52, + "end": 1.64, + "confidence": 0.977 + }, + { + "text": "l'avion", + "start": 1.64, + "end": 2.02, + "confidence": 0.994 + }, + { + "text": "vole?", + "start": 2.02, + "end": 2.34, + "confidence": 0.891 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/corner_cases.cpu/accurate.tiny_apollo11.mp3.words.json b/tests/expected/corner_cases.cpu/accurate.tiny_apollo11.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..b8cef4748a2e67b9548f033c7facf02873fcab99 --- /dev/null +++ b/tests/expected/corner_cases.cpu/accurate.tiny_apollo11.mp3.words.json @@ -0,0 +1,1481 @@ +{ + "text": " I'm all around my business and we gotta eat recommendations for you on your door to the VA We have 18A's I'm all around my business and I'm all around my business and I'm all around my business I got a little bit of a problem with that, and you want to have the advice down My goal is to reach these things, not to reach out to them and they're out of the bag And I can't see anything else, I don't want to hear anything else I'm at the least, I'm not making the tag I can't see anything else Yeah, I'm taking a heavy out of the bag We're on the highway, we're on the highway, we're on the highway We're on the highway, we're on the highway We want to hear that, this is the case, we know we can't get that much of our business So I guess we'll be somewhere in our place, but it's not over Okay, it's not over, it's not over, it's not over", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.6, + "end": 5.28, + "text": " I'm all around my business and we gotta eat recommendations for you on your door to the VA", + "tokens": [ + 286, + 478, + 439, + 926, + 452, + 1606, + 293, + 321, + 3428, + 1862, + 10434, + 337, + 291, + 322, + 428, + 2853, + 281, + 264, + 18527 + ], + "temperature": 0.0, + "avg_logprob": -0.4247800021701389, + "compression_ratio": 6.281818181818182, + "no_speech_prob": 0.3518604338169098, + "confidence": 0.27, + "words": [ + { + "text": "I'm", + "start": 0.6, + "end": 0.74, + "confidence": 0.168 + }, + { + "text": "all", + "start": 0.74, + "end": 1.02, + "confidence": 0.083 + }, + { + "text": "around", + "start": 1.02, + "end": 1.24, + "confidence": 0.103 + }, + { + "text": "my", + "start": 1.24, + "end": 1.42, + "confidence": 0.129 + }, + { + "text": "business", + "start": 1.42, + "end": 1.62, + "confidence": 0.339 + }, + { + "text": "and", + 
"start": 1.62, + "end": 1.9, + "confidence": 0.613 + }, + { + "text": "we", + "start": 1.9, + "end": 1.98, + "confidence": 0.938 + }, + { + "text": "gotta", + "start": 1.98, + "end": 2.16, + "confidence": 0.402 + }, + { + "text": "eat", + "start": 2.16, + "end": 2.38, + "confidence": 0.246 + }, + { + "text": "recommendations", + "start": 2.38, + "end": 2.84, + "confidence": 0.111 + }, + { + "text": "for", + "start": 2.84, + "end": 3.48, + "confidence": 0.236 + }, + { + "text": "you", + "start": 3.48, + "end": 3.62, + "confidence": 0.95 + }, + { + "text": "on", + "start": 3.62, + "end": 3.82, + "confidence": 0.774 + }, + { + "text": "your", + "start": 3.82, + "end": 4.36, + "confidence": 0.598 + }, + { + "text": "door", + "start": 4.36, + "end": 4.62, + "confidence": 0.113 + }, + { + "text": "to", + "start": 4.62, + "end": 4.84, + "confidence": 0.194 + }, + { + "text": "the", + "start": 4.84, + "end": 4.9, + "confidence": 0.457 + }, + { + "text": "VA", + "start": 4.9, + "end": 5.28, + "confidence": 0.23 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 5.28, + "end": 6.82, + "text": " We have 18A's", + "tokens": [ + 492, + 362, + 2443, + 32, + 311 + ], + "temperature": 0.0, + "avg_logprob": -0.4247800021701389, + "compression_ratio": 6.281818181818182, + "no_speech_prob": 0.3518604338169098, + "confidence": 0.189, + "words": [ + { + "text": "We", + "start": 5.28, + "end": 5.6, + "confidence": 0.056 + }, + { + "text": "have", + "start": 5.6, + "end": 5.72, + "confidence": 0.61 + }, + { + "text": "18A's", + "start": 5.72, + "end": 6.82, + "confidence": 0.191 + } + ] + }, + { + "id": 2, + "seek": 700, + "start": 7.02, + "end": 24.14, + "text": " I'm all around my business and I'm all around my business and I'm all around my business", + "tokens": [ + 286, + 478, + 439, + 926, + 452, + 1606, + 293, + 286, + 478, + 439, + 926, + 452, + 1606, + 293, + 286, + 478, + 439, + 926, + 452, + 1606 + ], + "temperature": 0.0, + "avg_logprob": -0.8006511529286703, + 
"compression_ratio": 2.1463414634146343, + "no_speech_prob": 0.1812065988779068, + "confidence": 0.476, + "words": [ + { + "text": "I'm", + "start": 7.02, + "end": 11.1, + "confidence": 0.124 + }, + { + "text": "all", + "start": 11.1, + "end": 13.62, + "confidence": 0.143 + }, + { + "text": "around", + "start": 13.62, + "end": 13.66, + "confidence": 0.517 + }, + { + "text": "my", + "start": 13.66, + "end": 13.7, + "confidence": 0.294 + }, + { + "text": "business", + "start": 13.7, + "end": 13.74, + "confidence": 0.931 + }, + { + "text": "and", + "start": 13.74, + "end": 14.08, + "confidence": 0.249 + }, + { + "text": "I'm", + "start": 14.08, + "end": 14.48, + "confidence": 0.379 + }, + { + "text": "all", + "start": 14.48, + "end": 14.68, + "confidence": 0.368 + }, + { + "text": "around", + "start": 14.68, + "end": 14.72, + "confidence": 0.892 + }, + { + "text": "my", + "start": 14.72, + "end": 14.76, + "confidence": 0.743 + }, + { + "text": "business", + "start": 14.76, + "end": 14.8, + "confidence": 0.981 + }, + { + "text": "and", + "start": 14.8, + "end": 15.04, + "confidence": 0.391 + }, + { + "text": "I'm", + "start": 15.04, + "end": 16.06, + "confidence": 0.861 + }, + { + "text": "all", + "start": 16.06, + "end": 16.12, + "confidence": 0.674 + }, + { + "text": "around", + "start": 16.12, + "end": 16.8, + "confidence": 0.932 + }, + { + "text": "my", + "start": 16.8, + "end": 21.82, + "confidence": 0.765 + }, + { + "text": "business", + "start": 21.82, + "end": 24.14, + "confidence": 0.977 + } + ] + }, + { + "id": 3, + "seek": 3100, + "start": 31.24, + "end": 36.52, + "text": " I got a little bit of a problem with that, and you want to have the advice down", + "tokens": [ + 286, + 658, + 257, + 707, + 857, + 295, + 257, + 1154, + 365, + 300, + 11, + 293, + 291, + 528, + 281, + 362, + 264, + 5192, + 760 + ], + "temperature": 0.0, + "avg_logprob": -1.0431414517489346, + "compression_ratio": 1.8074866310160427, + "no_speech_prob": 0.09527108818292618, + 
"confidence": 0.336, + "words": [ + { + "text": "I", + "start": 31.24, + "end": 31.66, + "confidence": 0.447 + }, + { + "text": "got", + "start": 31.66, + "end": 31.96, + "confidence": 0.219 + }, + { + "text": "a", + "start": 31.96, + "end": 33.32, + "confidence": 0.159 + }, + { + "text": "little", + "start": 33.32, + "end": 33.52, + "confidence": 0.104 + }, + { + "text": "bit", + "start": 33.52, + "end": 33.74, + "confidence": 0.919 + }, + { + "text": "of", + "start": 33.74, + "end": 33.86, + "confidence": 0.903 + }, + { + "text": "a", + "start": 33.86, + "end": 33.94, + "confidence": 0.347 + }, + { + "text": "problem", + "start": 33.94, + "end": 34.12, + "confidence": 0.226 + }, + { + "text": "with", + "start": 34.12, + "end": 34.38, + "confidence": 0.395 + }, + { + "text": "that,", + "start": 34.38, + "end": 34.52, + "confidence": 0.175 + }, + { + "text": "and", + "start": 34.52, + "end": 34.58, + "confidence": 0.331 + }, + { + "text": "you", + "start": 34.58, + "end": 34.7, + "confidence": 0.511 + }, + { + "text": "want", + "start": 34.7, + "end": 35.0, + "confidence": 0.533 + }, + { + "text": "to", + "start": 35.0, + "end": 35.06, + "confidence": 0.568 + }, + { + "text": "have", + "start": 35.06, + "end": 35.36, + "confidence": 0.857 + }, + { + "text": "the", + "start": 35.36, + "end": 35.52, + "confidence": 0.519 + }, + { + "text": "advice", + "start": 35.52, + "end": 35.88, + "confidence": 0.077 + }, + { + "text": "down", + "start": 35.88, + "end": 36.52, + "confidence": 0.231 + } + ] + }, + { + "id": 4, + "seek": 3100, + "start": 37.68, + "end": 41.92, + "text": " My goal is to reach these things, not to reach out to them and they're out of the bag", + "tokens": [ + 1222, + 3387, + 307, + 281, + 2524, + 613, + 721, + 11, + 406, + 281, + 2524, + 484, + 281, + 552, + 293, + 436, + 434, + 484, + 295, + 264, + 3411 + ], + "temperature": 0.0, + "avg_logprob": -1.0431414517489346, + "compression_ratio": 1.8074866310160427, + "no_speech_prob": 0.09527108818292618, 
+ "confidence": 0.312, + "words": [ + { + "text": "My", + "start": 37.68, + "end": 38.04, + "confidence": 0.443 + }, + { + "text": "goal", + "start": 38.04, + "end": 38.14, + "confidence": 0.106 + }, + { + "text": "is", + "start": 38.14, + "end": 38.34, + "confidence": 0.697 + }, + { + "text": "to", + "start": 38.34, + "end": 38.68, + "confidence": 0.952 + }, + { + "text": "reach", + "start": 38.68, + "end": 38.84, + "confidence": 0.185 + }, + { + "text": "these", + "start": 38.84, + "end": 39.12, + "confidence": 0.19 + }, + { + "text": "things,", + "start": 39.12, + "end": 39.62, + "confidence": 0.06 + }, + { + "text": "not", + "start": 39.62, + "end": 40.1, + "confidence": 0.865 + }, + { + "text": "to", + "start": 40.1, + "end": 40.22, + "confidence": 0.13 + }, + { + "text": "reach", + "start": 40.22, + "end": 40.36, + "confidence": 0.433 + }, + { + "text": "out", + "start": 40.36, + "end": 40.58, + "confidence": 0.376 + }, + { + "text": "to", + "start": 40.58, + "end": 40.72, + "confidence": 0.771 + }, + { + "text": "them", + "start": 40.72, + "end": 40.84, + "confidence": 0.296 + }, + { + "text": "and", + "start": 40.84, + "end": 40.88, + "confidence": 0.254 + }, + { + "text": "they're", + "start": 40.88, + "end": 41.1, + "confidence": 0.244 + }, + { + "text": "out", + "start": 41.1, + "end": 41.34, + "confidence": 0.162 + }, + { + "text": "of", + "start": 41.34, + "end": 41.58, + "confidence": 0.722 + }, + { + "text": "the", + "start": 41.58, + "end": 41.68, + "confidence": 0.562 + }, + { + "text": "bag", + "start": 41.68, + "end": 41.92, + "confidence": 0.277 + } + ] + }, + { + "id": 5, + "seek": 3100, + "start": 43.52, + "end": 47.08, + "text": " And I can't see anything else, I don't want to hear anything else", + "tokens": [ + 400, + 286, + 393, + 380, + 536, + 1340, + 1646, + 11, + 286, + 500, + 380, + 528, + 281, + 1568, + 1340, + 1646 + ], + "temperature": 0.0, + "avg_logprob": -1.0431414517489346, + "compression_ratio": 1.8074866310160427, + 
"no_speech_prob": 0.09527108818292618, + "confidence": 0.326, + "words": [ + { + "text": "And", + "start": 43.52, + "end": 43.56, + "confidence": 0.363 + }, + { + "text": "I", + "start": 43.56, + "end": 44.12, + "confidence": 0.396 + }, + { + "text": "can't", + "start": 44.12, + "end": 44.9, + "confidence": 0.248 + }, + { + "text": "see", + "start": 44.9, + "end": 45.08, + "confidence": 0.22 + }, + { + "text": "anything", + "start": 45.08, + "end": 45.64, + "confidence": 0.254 + }, + { + "text": "else,", + "start": 45.64, + "end": 45.68, + "confidence": 0.295 + }, + { + "text": "I", + "start": 45.68, + "end": 46.4, + "confidence": 0.191 + }, + { + "text": "don't", + "start": 46.4, + "end": 46.56, + "confidence": 0.615 + }, + { + "text": "want", + "start": 46.56, + "end": 46.6, + "confidence": 0.269 + }, + { + "text": "to", + "start": 46.6, + "end": 46.64, + "confidence": 0.744 + }, + { + "text": "hear", + "start": 46.64, + "end": 46.76, + "confidence": 0.262 + }, + { + "text": "anything", + "start": 46.76, + "end": 46.88, + "confidence": 0.287 + }, + { + "text": "else", + "start": 46.88, + "end": 47.08, + "confidence": 0.311 + } + ] + }, + { + "id": 6, + "seek": 3100, + "start": 48.24, + "end": 49.68, + "text": " I'm at the least, I'm not making the tag", + "tokens": [ + 286, + 478, + 412, + 264, + 1935, + 11, + 286, + 478, + 406, + 1455, + 264, + 6162 + ], + "temperature": 0.0, + "avg_logprob": -1.0431414517489346, + "compression_ratio": 1.8074866310160427, + "no_speech_prob": 0.09527108818292618, + "confidence": 0.379, + "words": [ + { + "text": "I'm", + "start": 48.24, + "end": 48.48, + "confidence": 0.231 + }, + { + "text": "at", + "start": 48.48, + "end": 48.52, + "confidence": 0.206 + }, + { + "text": "the", + "start": 48.52, + "end": 48.68, + "confidence": 0.811 + }, + { + "text": "least,", + "start": 48.68, + "end": 48.94, + "confidence": 0.235 + }, + { + "text": "I'm", + "start": 48.94, + "end": 49.0, + "confidence": 0.424 + }, + { + "text": "not", + 
"start": 49.0, + "end": 49.12, + "confidence": 0.938 + }, + { + "text": "making", + "start": 49.12, + "end": 49.26, + "confidence": 0.293 + }, + { + "text": "the", + "start": 49.26, + "end": 49.44, + "confidence": 0.747 + }, + { + "text": "tag", + "start": 49.44, + "end": 49.68, + "confidence": 0.298 + } + ] + }, + { + "id": 7, + "seek": 3100, + "start": 51.46, + "end": 52.88, + "text": " I can't see anything else", + "tokens": [ + 286, + 393, + 380, + 536, + 1340, + 1646 + ], + "temperature": 0.0, + "avg_logprob": -1.0431414517489346, + "compression_ratio": 1.8074866310160427, + "no_speech_prob": 0.09527108818292618, + "confidence": 0.412, + "words": [ + { + "text": "I", + "start": 51.46, + "end": 51.5, + "confidence": 0.173 + }, + { + "text": "can't", + "start": 51.5, + "end": 51.86, + "confidence": 0.374 + }, + { + "text": "see", + "start": 51.86, + "end": 52.2, + "confidence": 0.34 + }, + { + "text": "anything", + "start": 52.2, + "end": 52.5, + "confidence": 0.915 + }, + { + "text": "else", + "start": 52.5, + "end": 52.88, + "confidence": 0.653 + } + ] + }, + { + "id": 8, + "seek": 3100, + "start": 53.16, + "end": 54.7, + "text": " Yeah, I'm taking a heavy out of the bag", + "tokens": [ + 865, + 11, + 286, + 478, + 1940, + 257, + 4676, + 484, + 295, + 264, + 3411 + ], + "temperature": 0.0, + "avg_logprob": -1.0431414517489346, + "compression_ratio": 1.8074866310160427, + "no_speech_prob": 0.09527108818292618, + "confidence": 0.28, + "words": [ + { + "text": "Yeah,", + "start": 53.16, + "end": 53.38, + "confidence": 0.569 + }, + { + "text": "I'm", + "start": 53.38, + "end": 53.46, + "confidence": 0.59 + }, + { + "text": "taking", + "start": 53.46, + "end": 53.64, + "confidence": 0.881 + }, + { + "text": "a", + "start": 53.64, + "end": 53.76, + "confidence": 0.177 + }, + { + "text": "heavy", + "start": 53.76, + "end": 54.04, + "confidence": 0.1 + }, + { + "text": "out", + "start": 54.04, + "end": 54.28, + "confidence": 0.073 + }, + { + "text": "of", + "start": 
54.28, + "end": 54.42, + "confidence": 0.948 + }, + { + "text": "the", + "start": 54.42, + "end": 54.6, + "confidence": 0.168 + }, + { + "text": "bag", + "start": 54.6, + "end": 54.7, + "confidence": 0.084 + } + ] + }, + { + "id": 9, + "seek": 5600, + "start": 56.46, + "end": 59.78, + "text": " We're on the highway, we're on the highway, we're on the highway", + "tokens": [ + 492, + 434, + 322, + 264, + 17205, + 11, + 321, + 434, + 322, + 264, + 17205, + 11, + 321, + 434, + 322, + 264, + 17205 + ], + "temperature": 0.0, + "avg_logprob": -0.750541016295716, + "compression_ratio": 1.901840490797546, + "no_speech_prob": 0.01289769820868969, + "confidence": 0.498, + "words": [ + { + "text": "We're", + "start": 56.46, + "end": 56.94, + "confidence": 0.281 + }, + { + "text": "on", + "start": 56.94, + "end": 57.18, + "confidence": 0.116 + }, + { + "text": "the", + "start": 57.18, + "end": 57.26, + "confidence": 0.261 + }, + { + "text": "highway,", + "start": 57.26, + "end": 57.78, + "confidence": 0.129 + }, + { + "text": "we're", + "start": 57.78, + "end": 58.32, + "confidence": 0.604 + }, + { + "text": "on", + "start": 58.32, + "end": 58.44, + "confidence": 0.813 + }, + { + "text": "the", + "start": 58.44, + "end": 58.74, + "confidence": 0.861 + }, + { + "text": "highway,", + "start": 58.74, + "end": 58.94, + "confidence": 0.925 + }, + { + "text": "we're", + "start": 58.94, + "end": 58.98, + "confidence": 0.742 + }, + { + "text": "on", + "start": 58.98, + "end": 59.02, + "confidence": 0.82 + }, + { + "text": "the", + "start": 59.02, + "end": 59.18, + "confidence": 0.937 + }, + { + "text": "highway", + "start": 59.18, + "end": 59.78, + "confidence": 0.948 + } + ] + }, + { + "id": 10, + "seek": 5600, + "start": 60.52, + "end": 66.02, + "text": " We're on the highway, we're on the highway", + "tokens": [ + 492, + 434, + 322, + 264, + 17205, + 11, + 321, + 434, + 322, + 264, + 17205 + ], + "temperature": 0.0, + "avg_logprob": -0.750541016295716, + "compression_ratio": 
1.901840490797546, + "no_speech_prob": 0.01289769820868969, + "confidence": 0.785, + "words": [ + { + "text": "We're", + "start": 60.52, + "end": 60.66, + "confidence": 0.62 + }, + { + "text": "on", + "start": 60.66, + "end": 60.84, + "confidence": 0.437 + }, + { + "text": "the", + "start": 60.84, + "end": 60.88, + "confidence": 0.94 + }, + { + "text": "highway,", + "start": 60.88, + "end": 61.16, + "confidence": 0.977 + }, + { + "text": "we're", + "start": 61.16, + "end": 63.48, + "confidence": 0.865 + }, + { + "text": "on", + "start": 63.48, + "end": 63.62, + "confidence": 0.911 + }, + { + "text": "the", + "start": 63.62, + "end": 63.7, + "confidence": 0.892 + }, + { + "text": "highway", + "start": 63.7, + "end": 66.02, + "confidence": 0.945 + } + ] + }, + { + "id": 11, + "seek": 5600, + "start": 66.02, + "end": 69.04, + "text": " We want to hear that, this is the case, we know we can't get that much of our business", + "tokens": [ + 492, + 528, + 281, + 1568, + 300, + 11, + 341, + 307, + 264, + 1389, + 11, + 321, + 458, + 321, + 393, + 380, + 483, + 300, + 709, + 295, + 527, + 1606 + ], + "temperature": 0.0, + "avg_logprob": -0.750541016295716, + "compression_ratio": 1.901840490797546, + "no_speech_prob": 0.01289769820868969, + "confidence": 0.371, + "words": [ + { + "text": "We", + "start": 66.02, + "end": 66.06, + "confidence": 0.369 + }, + { + "text": "want", + "start": 66.06, + "end": 66.1, + "confidence": 0.335 + }, + { + "text": "to", + "start": 66.1, + "end": 66.14, + "confidence": 0.662 + }, + { + "text": "hear", + "start": 66.14, + "end": 66.18, + "confidence": 0.323 + }, + { + "text": "that,", + "start": 66.18, + "end": 66.22, + "confidence": 0.878 + }, + { + "text": "this", + "start": 66.22, + "end": 66.26, + "confidence": 0.265 + }, + { + "text": "is", + "start": 66.26, + "end": 66.3, + "confidence": 0.806 + }, + { + "text": "the", + "start": 66.3, + "end": 66.34, + "confidence": 0.286 + }, + { + "text": "case,", + "start": 66.34, + "end": 66.38, + 
"confidence": 0.195 + }, + { + "text": "we", + "start": 66.38, + "end": 66.92, + "confidence": 0.423 + }, + { + "text": "know", + "start": 66.92, + "end": 66.96, + "confidence": 0.736 + }, + { + "text": "we", + "start": 66.96, + "end": 67.06, + "confidence": 0.814 + }, + { + "text": "can't", + "start": 67.06, + "end": 67.3, + "confidence": 0.339 + }, + { + "text": "get", + "start": 67.3, + "end": 67.4, + "confidence": 0.219 + }, + { + "text": "that", + "start": 67.4, + "end": 67.64, + "confidence": 0.209 + }, + { + "text": "much", + "start": 67.64, + "end": 68.46, + "confidence": 0.213 + }, + { + "text": "of", + "start": 68.46, + "end": 68.7, + "confidence": 0.59 + }, + { + "text": "our", + "start": 68.7, + "end": 68.74, + "confidence": 0.679 + }, + { + "text": "business", + "start": 68.74, + "end": 69.04, + "confidence": 0.077 + } + ] + }, + { + "id": 12, + "seek": 5600, + "start": 69.04, + "end": 72.64, + "text": " So I guess we'll be somewhere in our place, but it's not over", + "tokens": [ + 407, + 286, + 2041, + 321, + 603, + 312, + 4079, + 294, + 527, + 1081, + 11, + 457, + 309, + 311, + 406, + 670 + ], + "temperature": 0.0, + "avg_logprob": -0.750541016295716, + "compression_ratio": 1.901840490797546, + "no_speech_prob": 0.01289769820868969, + "confidence": 0.435, + "words": [ + { + "text": "So", + "start": 69.04, + "end": 70.38, + "confidence": 0.736 + }, + { + "text": "I", + "start": 70.38, + "end": 70.52, + "confidence": 0.675 + }, + { + "text": "guess", + "start": 70.52, + "end": 70.68, + "confidence": 0.721 + }, + { + "text": "we'll", + "start": 70.68, + "end": 71.04, + "confidence": 0.462 + }, + { + "text": "be", + "start": 71.04, + "end": 71.22, + "confidence": 0.27 + }, + { + "text": "somewhere", + "start": 71.22, + "end": 71.36, + "confidence": 0.369 + }, + { + "text": "in", + "start": 71.36, + "end": 71.4, + "confidence": 0.107 + }, + { + "text": "our", + "start": 71.4, + "end": 71.5, + "confidence": 0.192 + }, + { + "text": "place,", + "start": 
71.5, + "end": 71.92, + "confidence": 0.38 + }, + { + "text": "but", + "start": 71.92, + "end": 72.14, + "confidence": 0.431 + }, + { + "text": "it's", + "start": 72.14, + "end": 72.36, + "confidence": 0.939 + }, + { + "text": "not", + "start": 72.36, + "end": 72.4, + "confidence": 0.552 + }, + { + "text": "over", + "start": 72.4, + "end": 72.64, + "confidence": 0.308 + } + ] + }, + { + "id": 13, + "seek": 7400, + "start": 74.02, + "end": 78.4, + "text": " Okay, it's not over, it's not over, it's not over", + "tokens": [ + 50364, + 1033, + 11, + 309, + 311, + 406, + 670, + 11, + 309, + 311, + 406, + 670, + 11, + 309, + 311, + 406, + 670, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.405017099882427, + "compression_ratio": 1.6896551724137931, + "no_speech_prob": 0.01679050177335739, + "confidence": 0.705, + "words": [ + { + "text": "Okay,", + "start": 74.02, + "end": 75.9, + "confidence": 0.147 + }, + { + "text": "it's", + "start": 75.9, + "end": 76.16, + "confidence": 0.589 + }, + { + "text": "not", + "start": 76.16, + "end": 76.22, + "confidence": 0.956 + }, + { + "text": "over,", + "start": 76.22, + "end": 76.76, + "confidence": 0.89 + }, + { + "text": "it's", + "start": 76.76, + "end": 77.08, + "confidence": 0.647 + }, + { + "text": "not", + "start": 77.08, + "end": 77.18, + "confidence": 0.897 + }, + { + "text": "over,", + "start": 77.18, + "end": 77.36, + "confidence": 0.962 + }, + { + "text": "it's", + "start": 77.36, + "end": 77.86, + "confidence": 0.869 + }, + { + "text": "not", + "start": 77.86, + "end": 78.26, + "confidence": 0.955 + }, + { + "text": "over", + "start": 78.26, + "end": 78.4, + "confidence": 0.934 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases.cpu/large_apollo11.mp3.words.json b/tests/expected/corner_cases.cpu/large_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..2132c86c44928d8182b1d362dfc9798acda75397 --- /dev/null +++ 
b/tests/expected/corner_cases.cpu/large_apollo11.mp3.words.json @@ -0,0 +1,2212 @@ +{ + "text": " Apollo 11, Houston, we got a recommendation for you on your Doige's EAs, LM EG EAs, over. Go ahead. We'd like to see it as a selected one or two on the helmet. We're gonna have it in B1, and you can put the other one on Mike's helmet, we're still seeing it. Okay. All right. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. We got some. Yeah, we're taking next day autumn to heal up. You won't hack me on this. You won't hack me on this. With a cover, I tried it already. Okay, fine. We weren't sure that this was a suggestion. We thought you could check it out. I'm not sure we've already done that. I guess, whatever you come up with, just let us know. Okay, no problem. 
Okay, no problem.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.52, + "end": 7.22, + "text": " Apollo 11, Houston, we got a recommendation for you on your Doige's EAs, LM EG EAs, over.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 11, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 1144, + 328, + 68, + 311, + 462, + 10884, + 11, + 46529, + 462, + 38, + 462, + 10884, + 11, + 670, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.6255288836599766, + "compression_ratio": 1.4371584699453552, + "no_speech_prob": 0.33187487721443176, + "confidence": 0.539, + "words": [ + { + "text": "Apollo", + "start": 0.52, + "end": 0.98, + "confidence": 0.791 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.54, + "confidence": 0.878 + }, + { + "text": "Houston,", + "start": 1.54, + "end": 1.98, + "confidence": 0.828 + }, + { + "text": "we", + "start": 1.98, + "end": 2.02, + "confidence": 0.892 + }, + { + "text": "got", + "start": 2.02, + "end": 2.16, + "confidence": 0.688 + }, + { + "text": "a", + "start": 2.16, + "end": 2.46, + "confidence": 0.995 + }, + { + "text": "recommendation", + "start": 2.46, + "end": 3.16, + "confidence": 0.71 + }, + { + "text": "for", + "start": 3.16, + "end": 3.6, + "confidence": 0.845 + }, + { + "text": "you", + "start": 3.6, + "end": 3.94, + "confidence": 0.86 + }, + { + "text": "on", + "start": 3.94, + "end": 3.98, + "confidence": 0.862 + }, + { + "text": "your", + "start": 3.98, + "end": 4.28, + "confidence": 0.767 + }, + { + "text": "Doige's", + "start": 4.28, + "end": 5.14, + "confidence": 0.261 + }, + { + "text": "EAs,", + "start": 5.14, + "end": 5.62, + "confidence": 0.347 + }, + { + "text": "LM", + "start": 5.62, + "end": 5.7, + "confidence": 0.275 + }, + { + "text": "EG", + "start": 5.7, + "end": 6.34, + "confidence": 0.3 + }, + { + "text": "EAs,", + "start": 6.34, + "end": 6.98, + "confidence": 0.695 + }, + { + "text": "over.", + "start": 6.98, + "end": 7.22, + "confidence": 0.838 + } + ] + }, + { + "id": 1, + 
"seek": 0, + "start": 10.84, + "end": 11.96, + "text": " Go ahead.", + "tokens": [ + 1037, + 2286, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.6255288836599766, + "compression_ratio": 1.4371584699453552, + "no_speech_prob": 0.33187487721443176, + "confidence": 0.788, + "words": [ + { + "text": "Go", + "start": 10.84, + "end": 11.06, + "confidence": 0.719 + }, + { + "text": "ahead.", + "start": 11.06, + "end": 11.96, + "confidence": 0.863 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 12.76, + "end": 17.48, + "text": " We'd like to see it as a selected one or two on the helmet.", + "tokens": [ + 492, + 1116, + 411, + 281, + 536, + 309, + 382, + 257, + 8209, + 472, + 420, + 732, + 322, + 264, + 15922, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.6255288836599766, + "compression_ratio": 1.4371584699453552, + "no_speech_prob": 0.33187487721443176, + "confidence": 0.359, + "words": [ + { + "text": "We'd", + "start": 12.76, + "end": 13.28, + "confidence": 0.31 + }, + { + "text": "like", + "start": 13.28, + "end": 13.62, + "confidence": 0.874 + }, + { + "text": "to", + "start": 13.62, + "end": 13.84, + "confidence": 0.728 + }, + { + "text": "see", + "start": 13.84, + "end": 14.14, + "confidence": 0.214 + }, + { + "text": "it", + "start": 14.14, + "end": 14.56, + "confidence": 0.067 + }, + { + "text": "as", + "start": 14.56, + "end": 14.6, + "confidence": 0.108 + }, + { + "text": "a", + "start": 14.6, + "end": 14.64, + "confidence": 0.223 + }, + { + "text": "selected", + "start": 14.64, + "end": 15.78, + "confidence": 0.136 + }, + { + "text": "one", + "start": 15.78, + "end": 16.14, + "confidence": 0.786 + }, + { + "text": "or", + "start": 16.14, + "end": 16.32, + "confidence": 0.644 + }, + { + "text": "two", + "start": 16.32, + "end": 16.6, + "confidence": 0.333 + }, + { + "text": "on", + "start": 16.6, + "end": 16.64, + "confidence": 0.858 + }, + { + "text": "the", + "start": 16.64, + "end": 16.98, + "confidence": 0.801 + }, + { + "text": "helmet.", + 
"start": 16.98, + "end": 17.48, + "confidence": 0.626 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 17.52, + "end": 24.34, + "text": " We're gonna have it in B1, and you can put the other one on Mike's helmet, we're still seeing it.", + "tokens": [ + 492, + 434, + 799, + 362, + 309, + 294, + 363, + 16, + 11, + 293, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 6602, + 311, + 15922, + 11, + 321, + 434, + 920, + 2577, + 309, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.6255288836599766, + "compression_ratio": 1.4371584699453552, + "no_speech_prob": 0.33187487721443176, + "confidence": 0.646, + "words": [ + { + "text": "We're", + "start": 17.52, + "end": 17.94, + "confidence": 0.673 + }, + { + "text": "gonna", + "start": 17.94, + "end": 18.12, + "confidence": 0.19 + }, + { + "text": "have", + "start": 18.12, + "end": 18.3, + "confidence": 0.848 + }, + { + "text": "it", + "start": 18.3, + "end": 18.4, + "confidence": 0.317 + }, + { + "text": "in", + "start": 18.4, + "end": 18.48, + "confidence": 0.667 + }, + { + "text": "B1,", + "start": 18.48, + "end": 20.24, + "confidence": 0.883 + }, + { + "text": "and", + "start": 20.24, + "end": 20.28, + "confidence": 0.824 + }, + { + "text": "you", + "start": 20.28, + "end": 20.38, + "confidence": 0.892 + }, + { + "text": "can", + "start": 20.38, + "end": 20.56, + "confidence": 0.513 + }, + { + "text": "put", + "start": 20.56, + "end": 20.74, + "confidence": 0.895 + }, + { + "text": "the", + "start": 20.74, + "end": 20.9, + "confidence": 0.812 + }, + { + "text": "other", + "start": 20.9, + "end": 21.12, + "confidence": 0.773 + }, + { + "text": "one", + "start": 21.12, + "end": 21.42, + "confidence": 0.778 + }, + { + "text": "on", + "start": 21.42, + "end": 21.82, + "confidence": 0.905 + }, + { + "text": "Mike's", + "start": 21.82, + "end": 22.96, + "confidence": 0.876 + }, + { + "text": "helmet,", + "start": 22.96, + "end": 23.12, + "confidence": 0.772 + }, + { + "text": "we're", + "start": 23.12, + "end": 
23.26, + "confidence": 0.455 + }, + { + "text": "still", + "start": 23.26, + "end": 23.42, + "confidence": 0.773 + }, + { + "text": "seeing", + "start": 23.42, + "end": 23.72, + "confidence": 0.667 + }, + { + "text": "it.", + "start": 23.72, + "end": 24.34, + "confidence": 0.243 + } + ] + }, + { + "id": 4, + "seek": 2400, + "start": 25.44, + "end": 25.48, + "text": " Okay.", + "tokens": [ + 1033, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.004, + "words": [ + { + "text": "Okay.", + "start": 25.44, + "end": 25.48, + "confidence": 0.004 + } + ] + }, + { + "id": 5, + "seek": 2400, + "start": 25.48, + "end": 26.0, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.281, + "words": [ + { + "text": "All", + "start": 25.48, + "end": 25.52, + "confidence": 0.093 + }, + { + "text": "right.", + "start": 25.52, + "end": 26.0, + "confidence": 0.849 + } + ] + }, + { + "id": 6, + "seek": 2400, + "start": 26.0, + "end": 27.5, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.06, + "words": [ + { + "text": "We", + "start": 26.0, + "end": 27.42, + "confidence": 0.08 + }, + { + "text": "got", + "start": 27.42, + "end": 27.46, + "confidence": 0.111 + }, + { + "text": "some.", + "start": 27.46, + "end": 27.5, + "confidence": 0.024 + } + ] + }, + { + "id": 7, + "seek": 2400, + "start": 28.4, + "end": 28.52, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.399, + "words": [ + { + 
"text": "We", + "start": 28.4, + "end": 28.44, + "confidence": 0.19 + }, + { + "text": "got", + "start": 28.44, + "end": 28.48, + "confidence": 0.527 + }, + { + "text": "some.", + "start": 28.48, + "end": 28.52, + "confidence": 0.633 + } + ] + }, + { + "id": 8, + "seek": 2400, + "start": 28.52, + "end": 28.96, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.468, + "words": [ + { + "text": "We", + "start": 28.52, + "end": 28.56, + "confidence": 0.231 + }, + { + "text": "got", + "start": 28.56, + "end": 28.6, + "confidence": 0.608 + }, + { + "text": "some.", + "start": 28.6, + "end": 28.96, + "confidence": 0.731 + } + ] + }, + { + "id": 9, + "seek": 2400, + "start": 28.96, + "end": 30.01, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.529, + "words": [ + { + "text": "We", + "start": 28.96, + "end": 29.0, + "confidence": 0.288 + }, + { + "text": "got", + "start": 29.0, + "end": 29.04, + "confidence": 0.675 + }, + { + "text": "some.", + "start": 29.04, + "end": 30.01, + "confidence": 0.761 + } + ] + }, + { + "id": 10, + "seek": 2400, + "start": 30.01, + "end": 31.5, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.596, + "words": [ + { + "text": "We", + "start": 30.01, + "end": 31.42, + "confidence": 0.378 + }, + { + "text": "got", + "start": 31.42, + "end": 31.46, + "confidence": 0.721 + }, + { + "text": "some.", + "start": 31.46, + "end": 31.5, + "confidence": 0.776 + } + ] + }, + { + "id": 11, + "seek": 2400, + "start": 31.5, + "end": 32.48, + "text": " We got 
some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.654, + "words": [ + { + "text": "We", + "start": 31.5, + "end": 32.14, + "confidence": 0.47 + }, + { + "text": "got", + "start": 32.14, + "end": 32.18, + "confidence": 0.757 + }, + { + "text": "some.", + "start": 32.18, + "end": 32.48, + "confidence": 0.787 + } + ] + }, + { + "id": 12, + "seek": 2400, + "start": 32.76, + "end": 33.26, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.707, + "words": [ + { + "text": "We", + "start": 32.76, + "end": 33.0, + "confidence": 0.573 + }, + { + "text": "got", + "start": 33.0, + "end": 33.22, + "confidence": 0.786 + }, + { + "text": "some.", + "start": 33.22, + "end": 33.26, + "confidence": 0.786 + } + ] + }, + { + "id": 13, + "seek": 2400, + "start": 33.26, + "end": 34.26, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.743, + "words": [ + { + "text": "We", + "start": 33.26, + "end": 33.3, + "confidence": 0.637 + }, + { + "text": "got", + "start": 33.3, + "end": 33.58, + "confidence": 0.811 + }, + { + "text": "some.", + "start": 33.58, + "end": 34.26, + "confidence": 0.794 + } + ] + }, + { + "id": 14, + "seek": 2400, + "start": 34.52, + "end": 35.06, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.761, + "words": [ + { + "text": "We", + "start": 34.52, + "end": 34.68, + "confidence": 0.672 + }, + { + "text": "got", + 
"start": 34.68, + "end": 35.02, + "confidence": 0.828 + }, + { + "text": "some.", + "start": 35.02, + "end": 35.06, + "confidence": 0.793 + } + ] + }, + { + "id": 15, + "seek": 2400, + "start": 35.18, + "end": 36.03, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.774, + "words": [ + { + "text": "We", + "start": 35.18, + "end": 35.48, + "confidence": 0.694 + }, + { + "text": "got", + "start": 35.48, + "end": 35.78, + "confidence": 0.843 + }, + { + "text": "some.", + "start": 35.78, + "end": 36.03, + "confidence": 0.792 + } + ] + }, + { + "id": 16, + "seek": 2400, + "start": 36.03, + "end": 36.16, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.787, + "words": [ + { + "text": "We", + "start": 36.03, + "end": 36.07, + "confidence": 0.714 + }, + { + "text": "got", + "start": 36.07, + "end": 36.11, + "confidence": 0.853 + }, + { + "text": "some.", + "start": 36.11, + "end": 36.16, + "confidence": 0.8 + } + ] + }, + { + "id": 17, + "seek": 2400, + "start": 37.66, + "end": 38.48, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.798, + "words": [ + { + "text": "We", + "start": 37.66, + "end": 38.0, + "confidence": 0.741 + }, + { + "text": "got", + "start": 38.0, + "end": 38.16, + "confidence": 0.86 + }, + { + "text": "some.", + "start": 38.16, + "end": 38.48, + "confidence": 0.797 + } + ] + }, + { + "id": 18, + "seek": 2400, + "start": 38.48, + "end": 39.2, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": 
-0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.798, + "words": [ + { + "text": "We", + "start": 38.48, + "end": 38.52, + "confidence": 0.739 + }, + { + "text": "got", + "start": 38.52, + "end": 38.56, + "confidence": 0.861 + }, + { + "text": "some.", + "start": 38.56, + "end": 39.2, + "confidence": 0.799 + } + ] + }, + { + "id": 19, + "seek": 2400, + "start": 40.16, + "end": 40.48, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.802, + "words": [ + { + "text": "We", + "start": 40.16, + "end": 40.2, + "confidence": 0.752 + }, + { + "text": "got", + "start": 40.2, + "end": 40.44, + "confidence": 0.862 + }, + { + "text": "some.", + "start": 40.44, + "end": 40.48, + "confidence": 0.797 + } + ] + }, + { + "id": 20, + "seek": 2400, + "start": 40.48, + "end": 40.68, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.802, + "words": [ + { + "text": "We", + "start": 40.48, + "end": 40.52, + "confidence": 0.751 + }, + { + "text": "got", + "start": 40.52, + "end": 40.56, + "confidence": 0.865 + }, + { + "text": "some.", + "start": 40.56, + "end": 40.68, + "confidence": 0.795 + } + ] + }, + { + "id": 21, + "seek": 2400, + "start": 41.36, + "end": 41.96, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.812, + "words": [ + { + "text": "We", + "start": 41.36, + "end": 41.4, + "confidence": 0.771 + }, + { + "text": "got", + "start": 41.4, + "end": 41.44, + "confidence": 0.871 + }, + { + "text": "some.", + "start": 
41.44, + "end": 41.96, + "confidence": 0.798 + } + ] + }, + { + "id": 22, + "seek": 2400, + "start": 41.96, + "end": 42.08, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.811, + "words": [ + { + "text": "We", + "start": 41.96, + "end": 42.0, + "confidence": 0.766 + }, + { + "text": "got", + "start": 42.0, + "end": 42.04, + "confidence": 0.873 + }, + { + "text": "some.", + "start": 42.04, + "end": 42.08, + "confidence": 0.797 + } + ] + }, + { + "id": 23, + "seek": 2400, + "start": 43.84, + "end": 44.48, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.821, + "words": [ + { + "text": "We", + "start": 43.84, + "end": 44.02, + "confidence": 0.782 + }, + { + "text": "got", + "start": 44.02, + "end": 44.28, + "confidence": 0.876 + }, + { + "text": "some.", + "start": 44.28, + "end": 44.48, + "confidence": 0.806 + } + ] + }, + { + "id": 24, + "seek": 2400, + "start": 44.56, + "end": 45.03, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.827, + "words": [ + { + "text": "We", + "start": 44.56, + "end": 44.6, + "confidence": 0.799 + }, + { + "text": "got", + "start": 44.6, + "end": 44.64, + "confidence": 0.88 + }, + { + "text": "some.", + "start": 44.64, + "end": 45.03, + "confidence": 0.804 + } + ] + }, + { + "id": 25, + "seek": 2400, + "start": 45.03, + "end": 45.15, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + 
"confidence": 0.828, + "words": [ + { + "text": "We", + "start": 45.03, + "end": 45.07, + "confidence": 0.802 + }, + { + "text": "got", + "start": 45.07, + "end": 45.11, + "confidence": 0.881 + }, + { + "text": "some.", + "start": 45.11, + "end": 45.15, + "confidence": 0.802 + } + ] + }, + { + "id": 26, + "seek": 2400, + "start": 46.24, + "end": 47.08, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.826, + "words": [ + { + "text": "We", + "start": 46.24, + "end": 46.44, + "confidence": 0.796 + }, + { + "text": "got", + "start": 46.44, + "end": 46.8, + "confidence": 0.883 + }, + { + "text": "some.", + "start": 46.8, + "end": 47.08, + "confidence": 0.801 + } + ] + }, + { + "id": 27, + "seek": 2400, + "start": 47.96, + "end": 48.08, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.827, + "words": [ + { + "text": "We", + "start": 47.96, + "end": 48.0, + "confidence": 0.805 + }, + { + "text": "got", + "start": 48.0, + "end": 48.04, + "confidence": 0.886 + }, + { + "text": "some.", + "start": 48.04, + "end": 48.08, + "confidence": 0.795 + } + ] + }, + { + "id": 28, + "seek": 2400, + "start": 48.3, + "end": 48.74, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.829, + "words": [ + { + "text": "We", + "start": 48.3, + "end": 48.6, + "confidence": 0.801 + }, + { + "text": "got", + "start": 48.6, + "end": 48.66, + "confidence": 0.887 + }, + { + "text": "some.", + "start": 48.66, + "end": 48.74, + "confidence": 0.802 + } + ] + }, + { + "id": 29, + "seek": 2400, + 
"start": 50.16, + "end": 50.5, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.832, + "words": [ + { + "text": "We", + "start": 50.16, + "end": 50.42, + "confidence": 0.809 + }, + { + "text": "got", + "start": 50.42, + "end": 50.46, + "confidence": 0.888 + }, + { + "text": "some.", + "start": 50.46, + "end": 50.5, + "confidence": 0.804 + } + ] + }, + { + "id": 30, + "seek": 2400, + "start": 50.5, + "end": 51.36, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.832, + "words": [ + { + "text": "We", + "start": 50.5, + "end": 51.28, + "confidence": 0.808 + }, + { + "text": "got", + "start": 51.28, + "end": 51.32, + "confidence": 0.885 + }, + { + "text": "some.", + "start": 51.32, + "end": 51.36, + "confidence": 0.804 + } + ] + }, + { + "id": 31, + "seek": 2400, + "start": 51.36, + "end": 51.94, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.832, + "words": [ + { + "text": "We", + "start": 51.36, + "end": 51.86, + "confidence": 0.811 + }, + { + "text": "got", + "start": 51.86, + "end": 51.9, + "confidence": 0.885 + }, + { + "text": "some.", + "start": 51.9, + "end": 51.94, + "confidence": 0.803 + } + ] + }, + { + "id": 32, + "seek": 2400, + "start": 51.94, + "end": 52.86, + "text": " We got some.", + "tokens": [ + 492, + 658, + 512, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.3070566034041388, + "compression_ratio": 9.175, + "no_speech_prob": 0.6738554835319519, + "confidence": 0.822, + "words": [ + { + "text": "We", + "start": 51.94, + "end": 51.98, + 
"confidence": 0.781 + }, + { + "text": "got", + "start": 51.98, + "end": 52.32, + "confidence": 0.887 + }, + { + "text": "some.", + "start": 52.32, + "end": 52.86, + "confidence": 0.8 + } + ] + }, + { + "id": 33, + "seek": 5300, + "start": 53.16, + "end": 56.06, + "text": " Yeah, we're taking next day autumn to heal up.", + "tokens": [ + 865, + 11, + 321, + 434, + 1940, + 958, + 786, + 24604, + 281, + 10526, + 493, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.348, + "words": [ + { + "text": "Yeah,", + "start": 53.16, + "end": 53.5, + "confidence": 0.243 + }, + { + "text": "we're", + "start": 53.5, + "end": 53.62, + "confidence": 0.597 + }, + { + "text": "taking", + "start": 53.62, + "end": 53.7, + "confidence": 0.694 + }, + { + "text": "next", + "start": 53.7, + "end": 53.98, + "confidence": 0.247 + }, + { + "text": "day", + "start": 53.98, + "end": 54.2, + "confidence": 0.555 + }, + { + "text": "autumn", + "start": 54.2, + "end": 54.4, + "confidence": 0.159 + }, + { + "text": "to", + "start": 54.4, + "end": 54.64, + "confidence": 0.186 + }, + { + "text": "heal", + "start": 54.64, + "end": 55.18, + "confidence": 0.129 + }, + { + "text": "up.", + "start": 55.18, + "end": 56.06, + "confidence": 0.817 + } + ] + }, + { + "id": 34, + "seek": 5300, + "start": 56.46, + "end": 57.86, + "text": " You won't hack me on this.", + "tokens": [ + 509, + 1582, + 380, + 10339, + 385, + 322, + 341, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.432, + "words": [ + { + "text": "You", + "start": 56.46, + "end": 56.8, + "confidence": 0.117 + }, + { + "text": "won't", + "start": 56.8, + "end": 57.2, + "confidence": 0.465 + }, + { + "text": "hack", + "start": 57.2, + "end": 57.46, + "confidence": 0.373 + }, + { + "text": "me", + "start": 
57.46, + "end": 57.66, + "confidence": 0.898 + }, + { + "text": "on", + "start": 57.66, + "end": 57.82, + "confidence": 0.807 + }, + { + "text": "this.", + "start": 57.82, + "end": 57.86, + "confidence": 0.413 + } + ] + }, + { + "id": 35, + "seek": 5300, + "start": 57.86, + "end": 59.79, + "text": " You won't hack me on this.", + "tokens": [ + 509, + 1582, + 380, + 10339, + 385, + 322, + 341, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.832, + "words": [ + { + "text": "You", + "start": 57.86, + "end": 58.08, + "confidence": 0.612 + }, + { + "text": "won't", + "start": 58.08, + "end": 58.76, + "confidence": 0.928 + }, + { + "text": "hack", + "start": 58.76, + "end": 58.8, + "confidence": 0.809 + }, + { + "text": "me", + "start": 58.8, + "end": 59.2, + "confidence": 0.905 + }, + { + "text": "on", + "start": 59.2, + "end": 59.3, + "confidence": 0.884 + }, + { + "text": "this.", + "start": 59.3, + "end": 59.79, + "confidence": 0.808 + } + ] + }, + { + "id": 36, + "seek": 5300, + "start": 59.79, + "end": 62.08, + "text": " With a cover, I tried it already.", + "tokens": [ + 2022, + 257, + 2060, + 11, + 286, + 3031, + 309, + 1217, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.638, + "words": [ + { + "text": "With", + "start": 59.79, + "end": 60.1, + "confidence": 0.363 + }, + { + "text": "a", + "start": 60.1, + "end": 60.14, + "confidence": 0.405 + }, + { + "text": "cover,", + "start": 60.14, + "end": 61.24, + "confidence": 0.814 + }, + { + "text": "I", + "start": 61.24, + "end": 61.28, + "confidence": 0.961 + }, + { + "text": "tried", + "start": 61.28, + "end": 61.56, + "confidence": 0.653 + }, + { + "text": "it", + "start": 61.56, + "end": 61.74, + "confidence": 0.73 + }, + { + "text": "already.", + "start": 61.74, + 
"end": 62.08, + "confidence": 0.785 + } + ] + }, + { + "id": 37, + "seek": 5300, + "start": 62.6, + "end": 65.32, + "text": " Okay, fine. We weren't sure that this was a suggestion.", + "tokens": [ + 1033, + 11, + 2489, + 13, + 492, + 4999, + 380, + 988, + 300, + 341, + 390, + 257, + 16541, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.722, + "words": [ + { + "text": "Okay,", + "start": 62.6, + "end": 62.92, + "confidence": 0.513 + }, + { + "text": "fine.", + "start": 62.92, + "end": 63.2, + "confidence": 0.861 + }, + { + "text": "We", + "start": 63.2, + "end": 63.36, + "confidence": 0.702 + }, + { + "text": "weren't", + "start": 63.36, + "end": 63.68, + "confidence": 0.909 + }, + { + "text": "sure", + "start": 63.68, + "end": 63.84, + "confidence": 0.829 + }, + { + "text": "that", + "start": 63.84, + "end": 64.24, + "confidence": 0.552 + }, + { + "text": "this", + "start": 64.24, + "end": 64.64, + "confidence": 0.741 + }, + { + "text": "was", + "start": 64.64, + "end": 64.8, + "confidence": 0.783 + }, + { + "text": "a", + "start": 64.8, + "end": 64.88, + "confidence": 0.819 + }, + { + "text": "suggestion.", + "start": 64.88, + "end": 65.32, + "confidence": 0.498 + } + ] + }, + { + "id": 38, + "seek": 5300, + "start": 66.76, + "end": 68.21, + "text": " We thought you could check it out.", + "tokens": [ + 492, + 1194, + 291, + 727, + 1520, + 309, + 484, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.721, + "words": [ + { + "text": "We", + "start": 66.76, + "end": 66.8, + "confidence": 0.891 + }, + { + "text": "thought", + "start": 66.8, + "end": 66.84, + "confidence": 0.813 + }, + { + "text": "you", + "start": 66.84, + "end": 67.06, + "confidence": 0.325 + }, + { + "text": "could", + "start": 67.06, + "end": 67.24, + 
"confidence": 0.784 + }, + { + "text": "check", + "start": 67.24, + "end": 67.5, + "confidence": 0.751 + }, + { + "text": "it", + "start": 67.5, + "end": 67.7, + "confidence": 0.899 + }, + { + "text": "out.", + "start": 67.7, + "end": 68.21, + "confidence": 0.812 + } + ] + }, + { + "id": 39, + "seek": 5300, + "start": 68.21, + "end": 69.48, + "text": " I'm not sure we've already done that.", + "tokens": [ + 286, + 478, + 406, + 988, + 321, + 600, + 1217, + 1096, + 300, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.455, + "words": [ + { + "text": "I'm", + "start": 68.21, + "end": 68.5, + "confidence": 0.179 + }, + { + "text": "not", + "start": 68.5, + "end": 68.6, + "confidence": 0.258 + }, + { + "text": "sure", + "start": 68.6, + "end": 68.76, + "confidence": 0.761 + }, + { + "text": "we've", + "start": 68.76, + "end": 68.9, + "confidence": 0.495 + }, + { + "text": "already", + "start": 68.9, + "end": 68.94, + "confidence": 0.765 + }, + { + "text": "done", + "start": 68.94, + "end": 69.18, + "confidence": 0.799 + }, + { + "text": "that.", + "start": 69.18, + "end": 69.48, + "confidence": 0.878 + } + ] + }, + { + "id": 40, + "seek": 5300, + "start": 70.38, + "end": 72.62, + "text": " I guess, whatever you come up with, just let us know.", + "tokens": [ + 286, + 2041, + 11, + 2035, + 291, + 808, + 493, + 365, + 11, + 445, + 718, + 505, + 458, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.738, + "words": [ + { + "text": "I", + "start": 70.38, + "end": 70.52, + "confidence": 0.55 + }, + { + "text": "guess,", + "start": 70.52, + "end": 70.96, + "confidence": 0.903 + }, + { + "text": "whatever", + "start": 70.96, + "end": 71.18, + "confidence": 0.404 + }, + { + "text": "you", + "start": 71.18, + "end": 71.22, + "confidence": 
0.89 + }, + { + "text": "come", + "start": 71.22, + "end": 71.54, + "confidence": 0.544 + }, + { + "text": "up", + "start": 71.54, + "end": 71.72, + "confidence": 0.892 + }, + { + "text": "with,", + "start": 71.72, + "end": 71.98, + "confidence": 0.816 + }, + { + "text": "just", + "start": 71.98, + "end": 72.16, + "confidence": 0.77 + }, + { + "text": "let", + "start": 72.16, + "end": 72.2, + "confidence": 0.898 + }, + { + "text": "us", + "start": 72.2, + "end": 72.34, + "confidence": 0.905 + }, + { + "text": "know.", + "start": 72.34, + "end": 72.62, + "confidence": 0.798 + } + ] + }, + { + "id": 41, + "seek": 5300, + "start": 74.18, + "end": 75.48, + "text": " Okay, no problem.", + "tokens": [ + 1033, + 11, + 572, + 1154, + 13 + ], + "temperature": 0.4, + "avg_logprob": -0.7040317565437377, + "compression_ratio": 1.7253218884120172, + "no_speech_prob": 0.4773952066898346, + "confidence": 0.699, + "words": [ + { + "text": "Okay,", + "start": 74.18, + "end": 74.66, + "confidence": 0.789 + }, + { + "text": "no", + "start": 74.66, + "end": 74.88, + "confidence": 0.548 + }, + { + "text": "problem.", + "start": 74.88, + "end": 75.48, + "confidence": 0.79 + } + ] + }, + { + "id": 42, + "seek": 7544, + "start": 75.48, + "end": 76.86, + "text": " Okay, no problem.", + "tokens": [ + 50364, + 1033, + 11, + 572, + 1154, + 13, + 50464 + ], + "temperature": 0.4, + "avg_logprob": -0.7493470907211304, + "compression_ratio": 0.68, + "no_speech_prob": 0.06937140226364136, + "confidence": 0.521, + "words": [ + { + "text": "Okay,", + "start": 75.48, + "end": 76.28, + "confidence": 0.386 + }, + { + "text": "no", + "start": 76.28, + "end": 76.32, + "confidence": 0.472 + }, + { + "text": "problem.", + "start": 76.32, + "end": 76.86, + "confidence": 0.775 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases.cpu/nocond.random_music.mp4.words.json b/tests/expected/corner_cases.cpu/nocond.random_music.mp4.words.json new file mode 
100644 index 0000000000000000000000000000000000000000..cffe4045f2a305e00267c28fb344c5011039e8b1 --- /dev/null +++ b/tests/expected/corner_cases.cpu/nocond.random_music.mp4.words.json @@ -0,0 +1,3209 @@ +{ + "text": " I Oh, the misery Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy Look out for yourself My enemy Look out for yourself But I'm ready Your words up on the wall You don't need to say I'm ready your words up on the wall as you're praying for my phone and the laughter in the holes and the names that I've I stack it in my mind and I'm waiting for the time When I show you what it's like to be worse than a mind Tell you you're the greatest But once you turn they hate us Oh, the misery Everybody wants to be my enemy I smell the sympathy Everybody wants to be my enemy Look out for yourself My enemy Look out for yourself Look, okay I'm hoping that somebody pray for me I'm praying that somebody vote for me I'm staying where nobody's supposed to be I propose to be in a rink of emotions Ready to go whenever you let me know The road is long so put the pedal into the flow The enemy on my trail, my energy unavailable I'm a tell a monster the way go Way when the plot on my track to the top I been out of shape thinking that I'm a box I'm an astronaut Blast it off the planet rock the cause catastrophe And it matters more because ahead and not ahead I thought about wreaking havoc on an opposition Kinda shockin' they want it static with precision I'm automatic quarterback I ain't talkin' second Pack it pack it up I don't panic Better batter up who the baddest It don't matter cause we it's your Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy Oh the misery Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy I swear, I swear I'll never be a saint I swear, my enemy I swear, I swear I'll never be a saint You got to be yourself!", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 
0.02, + "end": 0.4, + "text": " I", + "tokens": [ + 50364, + 286, + 50464 + ], + "temperature": 0.4, + "avg_logprob": -0.9367842674255371, + "compression_ratio": 0.1111111111111111, + "no_speech_prob": 0.7794302701950073, + "confidence": 0.032, + "words": [ + { + "text": "I", + "start": 0.02, + "end": 0.4, + "confidence": 0.032 + } + ] + }, + { + "id": 1, + "seek": 6000, + "start": 60.02, + "end": 68.54, + "text": " Oh, the misery Everybody wants to be my enemy", + "tokens": [ + 876, + 11, + 264, + 32309, + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.7892291628081223, + "compression_ratio": 1.627906976744186, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.669, + "words": [ + { + "text": "Oh,", + "start": 60.02, + "end": 65.44, + "confidence": 0.084 + }, + { + "text": "the", + "start": 65.44, + "end": 65.48, + "confidence": 0.796 + }, + { + "text": "misery", + "start": 65.48, + "end": 66.08, + "confidence": 0.993 + }, + { + "text": "Everybody", + "start": 66.08, + "end": 67.62, + "confidence": 0.431 + }, + { + "text": "wants", + "start": 67.62, + "end": 68.0, + "confidence": 0.983 + }, + { + "text": "to", + "start": 68.0, + "end": 68.18, + "confidence": 0.993 + }, + { + "text": "be", + "start": 68.18, + "end": 68.38, + "confidence": 0.996 + }, + { + "text": "my", + "start": 68.38, + "end": 68.5, + "confidence": 0.984 + }, + { + "text": "enemy", + "start": 68.5, + "end": 68.54, + "confidence": 0.984 + } + ] + }, + { + "id": 2, + "seek": 6000, + "start": 70.9, + "end": 75.92, + "text": " Spare the sympathy Everybody wants to be my enemy", + "tokens": [ + 1738, + 543, + 264, + 33240, + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.7892291628081223, + "compression_ratio": 1.627906976744186, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.932, + "words": [ + { + "text": "Spare", + "start": 70.9, + "end": 71.48, + "confidence": 0.789 + }, + { + "text": "the", + 
"start": 71.48, + "end": 71.7, + "confidence": 0.97 + }, + { + "text": "sympathy", + "start": 71.7, + "end": 72.56, + "confidence": 0.993 + }, + { + "text": "Everybody", + "start": 72.56, + "end": 73.86, + "confidence": 0.959 + }, + { + "text": "wants", + "start": 73.86, + "end": 74.26, + "confidence": 0.994 + }, + { + "text": "to", + "start": 74.26, + "end": 74.42, + "confidence": 0.998 + }, + { + "text": "be", + "start": 74.42, + "end": 75.16, + "confidence": 0.999 + }, + { + "text": "my", + "start": 75.16, + "end": 75.64, + "confidence": 0.869 + }, + { + "text": "enemy", + "start": 75.64, + "end": 75.92, + "confidence": 0.997 + } + ] + }, + { + "id": 3, + "seek": 6000, + "start": 79.98, + "end": 80.5, + "text": " Look out for yourself My enemy", + "tokens": [ + 2053, + 484, + 337, + 1803, + 1222, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.7892291628081223, + "compression_ratio": 1.627906976744186, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.778, + "words": [ + { + "text": "Look", + "start": 79.98, + "end": 80.12, + "confidence": 0.446 + }, + { + "text": "out", + "start": 80.12, + "end": 80.34, + "confidence": 0.99 + }, + { + "text": "for", + "start": 80.34, + "end": 80.38, + "confidence": 0.991 + }, + { + "text": "yourself", + "start": 80.38, + "end": 80.42, + "confidence": 0.971 + }, + { + "text": "My", + "start": 80.42, + "end": 80.46, + "confidence": 0.533 + }, + { + "text": "enemy", + "start": 80.46, + "end": 80.5, + "confidence": 0.979 + } + ] + }, + { + "id": 4, + "seek": 6000, + "start": 80.5, + "end": 81.28, + "text": " Look out for yourself But I'm ready", + "tokens": [ + 2053, + 484, + 337, + 1803, + 583, + 286, + 478, + 1919 + ], + "temperature": 0.4, + "avg_logprob": -0.7892291628081223, + "compression_ratio": 1.627906976744186, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.943, + "words": [ + { + "text": "Look", + "start": 80.5, + "end": 80.54, + "confidence": 0.844 + }, + { + "text": "out", + "start": 80.54, + 
"end": 80.58, + "confidence": 0.994 + }, + { + "text": "for", + "start": 80.58, + "end": 80.62, + "confidence": 0.999 + }, + { + "text": "yourself", + "start": 80.62, + "end": 80.66, + "confidence": 0.999 + }, + { + "text": "But", + "start": 80.66, + "end": 80.7, + "confidence": 0.767 + }, + { + "text": "I'm", + "start": 80.7, + "end": 81.04, + "confidence": 0.99 + }, + { + "text": "ready", + "start": 81.04, + "end": 81.28, + "confidence": 0.996 + } + ] + }, + { + "id": 5, + "seek": 6000, + "start": 86.14, + "end": 88.28, + "text": " Your words up on the wall You don't need to say", + "tokens": [ + 2260, + 2283, + 493, + 322, + 264, + 2929, + 509, + 500, + 380, + 643, + 281, + 584 + ], + "temperature": 0.4, + "avg_logprob": -0.7892291628081223, + "compression_ratio": 1.627906976744186, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.361, + "words": [ + { + "text": "Your", + "start": 86.14, + "end": 86.4, + "confidence": 0.618 + }, + { + "text": "words", + "start": 86.4, + "end": 86.44, + "confidence": 0.786 + }, + { + "text": "up", + "start": 86.44, + "end": 86.7, + "confidence": 0.891 + }, + { + "text": "on", + "start": 86.7, + "end": 86.98, + "confidence": 0.996 + }, + { + "text": "the", + "start": 86.98, + "end": 87.1, + "confidence": 0.985 + }, + { + "text": "wall", + "start": 87.1, + "end": 87.62, + "confidence": 0.711 + }, + { + "text": "You", + "start": 87.62, + "end": 87.92, + "confidence": 0.084 + }, + { + "text": "don't", + "start": 87.92, + "end": 88.16, + "confidence": 0.172 + }, + { + "text": "need", + "start": 88.16, + "end": 88.2, + "confidence": 0.149 + }, + { + "text": "to", + "start": 88.2, + "end": 88.24, + "confidence": 0.466 + }, + { + "text": "say", + "start": 88.24, + "end": 88.28, + "confidence": 0.094 + } + ] + }, + { + "id": 6, + "seek": 8774, + "start": 88.28, + "end": 94.25, + "text": " I'm ready your words up on the wall as you're praying for my phone and the laughter in the holes and the names that I've", + "tokens": [ + 286, 
+ 478, + 1919, + 428, + 2283, + 493, + 322, + 264, + 2929, + 382, + 291, + 434, + 15611, + 337, + 452, + 2593, + 293, + 264, + 13092, + 294, + 264, + 8118, + 293, + 264, + 5288, + 300, + 286, + 600 + ], + "temperature": 0.4, + "avg_logprob": -0.26142611746060646, + "compression_ratio": 1.486842105263158, + "no_speech_prob": 0.8554685115814209, + "confidence": 0.773, + "words": [ + { + "text": "I'm", + "start": 88.28, + "end": 88.32, + "confidence": 0.459 + }, + { + "text": "ready", + "start": 88.32, + "end": 88.52, + "confidence": 0.976 + }, + { + "text": "your", + "start": 88.52, + "end": 88.9, + "confidence": 0.592 + }, + { + "text": "words", + "start": 88.9, + "end": 89.14, + "confidence": 0.987 + }, + { + "text": "up", + "start": 89.14, + "end": 89.46, + "confidence": 0.974 + }, + { + "text": "on", + "start": 89.46, + "end": 89.6, + "confidence": 0.979 + }, + { + "text": "the", + "start": 89.6, + "end": 89.66, + "confidence": 0.985 + }, + { + "text": "wall", + "start": 89.66, + "end": 90.12, + "confidence": 0.45 + }, + { + "text": "as", + "start": 90.12, + "end": 90.32, + "confidence": 0.489 + }, + { + "text": "you're", + "start": 90.32, + "end": 90.64, + "confidence": 0.817 + }, + { + "text": "praying", + "start": 90.64, + "end": 90.8, + "confidence": 0.962 + }, + { + "text": "for", + "start": 90.8, + "end": 91.06, + "confidence": 0.956 + }, + { + "text": "my", + "start": 91.06, + "end": 91.26, + "confidence": 0.965 + }, + { + "text": "phone", + "start": 91.26, + "end": 91.72, + "confidence": 0.63 + }, + { + "text": "and", + "start": 91.72, + "end": 91.9, + "confidence": 0.687 + }, + { + "text": "the", + "start": 91.9, + "end": 92.0, + "confidence": 0.948 + }, + { + "text": "laughter", + "start": 92.0, + "end": 92.36, + "confidence": 0.87 + }, + { + "text": "in", + "start": 92.36, + "end": 92.72, + "confidence": 0.905 + }, + { + "text": "the", + "start": 92.72, + "end": 92.88, + "confidence": 0.982 + }, + { + "text": "holes", + "start": 92.88, + "end": 93.24, 
+ "confidence": 0.593 + }, + { + "text": "and", + "start": 93.24, + "end": 93.44, + "confidence": 0.6 + }, + { + "text": "the", + "start": 93.44, + "end": 93.52, + "confidence": 0.983 + }, + { + "text": "names", + "start": 93.52, + "end": 93.82, + "confidence": 0.98 + }, + { + "text": "that", + "start": 93.82, + "end": 94.08, + "confidence": 0.827 + }, + { + "text": "I've", + "start": 94.08, + "end": 94.25, + "confidence": 0.75 + } + ] + }, + { + "id": 7, + "seek": 9418, + "start": 94.25, + "end": 97.84, + "text": " I stack it in my mind and I'm waiting for the time", + "tokens": [ + 286, + 8630, + 309, + 294, + 452, + 1575, + 293, + 286, + 478, + 3806, + 337, + 264, + 565 + ], + "temperature": 0.4, + "avg_logprob": -0.4302098981795772, + "compression_ratio": 1.388157894736842, + "no_speech_prob": 0.8590295314788818, + "confidence": 0.764, + "words": [ + { + "text": "I", + "start": 94.25, + "end": 95.04, + "confidence": 0.29 + }, + { + "text": "stack", + "start": 95.04, + "end": 95.38, + "confidence": 0.341 + }, + { + "text": "it", + "start": 95.38, + "end": 95.7, + "confidence": 0.988 + }, + { + "text": "in", + "start": 95.7, + "end": 95.82, + "confidence": 0.987 + }, + { + "text": "my", + "start": 95.82, + "end": 96.02, + "confidence": 0.99 + }, + { + "text": "mind", + "start": 96.02, + "end": 96.42, + "confidence": 0.99 + }, + { + "text": "and", + "start": 96.42, + "end": 96.62, + "confidence": 0.382 + }, + { + "text": "I'm", + "start": 96.62, + "end": 96.72, + "confidence": 0.964 + }, + { + "text": "waiting", + "start": 96.72, + "end": 97.02, + "confidence": 0.952 + }, + { + "text": "for", + "start": 97.02, + "end": 97.34, + "confidence": 0.972 + }, + { + "text": "the", + "start": 97.34, + "end": 97.5, + "confidence": 0.986 + }, + { + "text": "time", + "start": 97.5, + "end": 97.84, + "confidence": 0.985 + } + ] + }, + { + "id": 8, + "seek": 9418, + "start": 98.0, + "end": 101.24, + "text": " When I show you what it's like to be worse than a mind", + "tokens": 
[ + 1133, + 286, + 855, + 291, + 437, + 309, + 311, + 411, + 281, + 312, + 5324, + 813, + 257, + 1575 + ], + "temperature": 0.4, + "avg_logprob": -0.4302098981795772, + "compression_ratio": 1.388157894736842, + "no_speech_prob": 0.8590295314788818, + "confidence": 0.655, + "words": [ + { + "text": "When", + "start": 98.0, + "end": 98.18, + "confidence": 0.768 + }, + { + "text": "I", + "start": 98.18, + "end": 98.22, + "confidence": 0.989 + }, + { + "text": "show", + "start": 98.22, + "end": 98.48, + "confidence": 0.931 + }, + { + "text": "you", + "start": 98.48, + "end": 98.76, + "confidence": 0.988 + }, + { + "text": "what", + "start": 98.76, + "end": 98.94, + "confidence": 0.991 + }, + { + "text": "it's", + "start": 98.94, + "end": 99.42, + "confidence": 0.981 + }, + { + "text": "like", + "start": 99.42, + "end": 99.46, + "confidence": 0.997 + }, + { + "text": "to", + "start": 99.46, + "end": 99.72, + "confidence": 0.681 + }, + { + "text": "be", + "start": 99.72, + "end": 99.78, + "confidence": 0.995 + }, + { + "text": "worse", + "start": 99.78, + "end": 100.04, + "confidence": 0.659 + }, + { + "text": "than", + "start": 100.04, + "end": 100.36, + "confidence": 0.173 + }, + { + "text": "a", + "start": 100.36, + "end": 100.6, + "confidence": 0.112 + }, + { + "text": "mind", + "start": 100.6, + "end": 101.24, + "confidence": 0.463 + } + ] + }, + { + "id": 9, + "seek": 9418, + "start": 102.06, + "end": 106.28, + "text": " Tell you you're the greatest", + "tokens": [ + 5115, + 291, + 291, + 434, + 264, + 6636 + ], + "temperature": 0.4, + "avg_logprob": -0.4302098981795772, + "compression_ratio": 1.388157894736842, + "no_speech_prob": 0.8590295314788818, + "confidence": 0.919, + "words": [ + { + "text": "Tell", + "start": 102.06, + "end": 102.1, + "confidence": 0.861 + }, + { + "text": "you", + "start": 102.1, + "end": 102.72, + "confidence": 0.991 + }, + { + "text": "you're", + "start": 102.72, + "end": 103.66, + "confidence": 0.855 + }, + { + "text": "the", + 
"start": 103.66, + "end": 104.1, + "confidence": 0.985 + }, + { + "text": "greatest", + "start": 104.1, + "end": 106.28, + "confidence": 0.978 + } + ] + }, + { + "id": 10, + "seek": 9418, + "start": 107.14, + "end": 112.98, + "text": " But once you turn they hate us", + "tokens": [ + 583, + 1564, + 291, + 1261, + 436, + 4700, + 505 + ], + "temperature": 0.4, + "avg_logprob": -0.4302098981795772, + "compression_ratio": 1.388157894736842, + "no_speech_prob": 0.8590295314788818, + "confidence": 0.893, + "words": [ + { + "text": "But", + "start": 107.14, + "end": 107.54, + "confidence": 0.976 + }, + { + "text": "once", + "start": 107.54, + "end": 108.38, + "confidence": 0.799 + }, + { + "text": "you", + "start": 108.38, + "end": 108.92, + "confidence": 0.998 + }, + { + "text": "turn", + "start": 108.92, + "end": 109.84, + "confidence": 0.889 + }, + { + "text": "they", + "start": 109.84, + "end": 110.4, + "confidence": 0.662 + }, + { + "text": "hate", + "start": 110.4, + "end": 111.88, + "confidence": 0.99 + }, + { + "text": "us", + "start": 111.88, + "end": 112.98, + "confidence": 0.999 + } + ] + }, + { + "id": 11, + "seek": 9418, + "start": 114.54, + "end": 119.18, + "text": " Oh, the misery Everybody wants to be my enemy", + "tokens": [ + 876, + 11, + 264, + 32309, + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.4302098981795772, + "compression_ratio": 1.388157894736842, + "no_speech_prob": 0.8590295314788818, + "confidence": 0.874, + "words": [ + { + "text": "Oh,", + "start": 114.54, + "end": 115.32, + "confidence": 0.74 + }, + { + "text": "the", + "start": 115.32, + "end": 115.36, + "confidence": 0.97 + }, + { + "text": "misery", + "start": 115.36, + "end": 116.36, + "confidence": 0.999 + }, + { + "text": "Everybody", + "start": 116.36, + "end": 117.52, + "confidence": 0.432 + }, + { + "text": "wants", + "start": 117.52, + "end": 117.9, + "confidence": 0.989 + }, + { + "text": "to", + "start": 117.9, + "end": 118.24, + 
"confidence": 0.998 + }, + { + "text": "be", + "start": 118.24, + "end": 118.28, + "confidence": 0.998 + }, + { + "text": "my", + "start": 118.28, + "end": 118.54, + "confidence": 0.997 + }, + { + "text": "enemy", + "start": 118.54, + "end": 119.18, + "confidence": 0.984 + } + ] + }, + { + "id": 12, + "seek": 12018, + "start": 120.2, + "end": 122.16, + "text": " I smell the sympathy", + "tokens": [ + 286, + 4316, + 264, + 33240 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.755, + "words": [ + { + "text": "I", + "start": 120.2, + "end": 120.54, + "confidence": 0.42 + }, + { + "text": "smell", + "start": 120.54, + "end": 121.36, + "confidence": 0.889 + }, + { + "text": "the", + "start": 121.36, + "end": 121.76, + "confidence": 0.892 + }, + { + "text": "sympathy", + "start": 121.76, + "end": 122.16, + "confidence": 0.979 + } + ] + }, + { + "id": 13, + "seek": 12018, + "start": 122.16, + "end": 126.08, + "text": " Everybody wants to be my enemy", + "tokens": [ + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.912, + "words": [ + { + "text": "Everybody", + "start": 122.16, + "end": 123.72, + "confidence": 0.923 + }, + { + "text": "wants", + "start": 123.72, + "end": 124.1, + "confidence": 0.984 + }, + { + "text": "to", + "start": 124.1, + "end": 124.68, + "confidence": 0.995 + }, + { + "text": "be", + "start": 124.68, + "end": 125.24, + "confidence": 0.996 + }, + { + "text": "my", + "start": 125.24, + "end": 125.5, + "confidence": 0.659 + }, + { + "text": "enemy", + "start": 125.5, + "end": 126.08, + "confidence": 0.97 + } + ] + }, + { + "id": 14, + "seek": 12018, + "start": 129.9, + "end": 130.86, + "text": " Look out for yourself", + "tokens": [ + 2053, + 484, + 337, + 1803 + ], + 
"temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.731, + "words": [ + { + "text": "Look", + "start": 129.9, + "end": 130.04, + "confidence": 0.313 + }, + { + "text": "out", + "start": 130.04, + "end": 130.3, + "confidence": 0.932 + }, + { + "text": "for", + "start": 130.3, + "end": 130.44, + "confidence": 0.991 + }, + { + "text": "yourself", + "start": 130.44, + "end": 130.86, + "confidence": 0.986 + } + ] + }, + { + "id": 15, + "seek": 12018, + "start": 131.52, + "end": 132.54, + "text": " My enemy", + "tokens": [ + 1222, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.937, + "words": [ + { + "text": "My", + "start": 131.52, + "end": 131.74, + "confidence": 0.891 + }, + { + "text": "enemy", + "start": 131.74, + "end": 132.54, + "confidence": 0.985 + } + ] + }, + { + "id": 16, + "seek": 12018, + "start": 136.06, + "end": 137.14, + "text": " Look out for yourself", + "tokens": [ + 2053, + 484, + 337, + 1803 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.991, + "words": [ + { + "text": "Look", + "start": 136.06, + "end": 136.18, + "confidence": 0.974 + }, + { + "text": "out", + "start": 136.18, + "end": 136.54, + "confidence": 0.994 + }, + { + "text": "for", + "start": 136.54, + "end": 136.74, + "confidence": 0.999 + }, + { + "text": "yourself", + "start": 136.74, + "end": 137.14, + "confidence": 0.999 + } + ] + }, + { + "id": 17, + "seek": 12018, + "start": 137.66, + "end": 140.18, + "text": " Look, okay I'm hoping that somebody pray for me", + "tokens": [ + 2053, + 11, + 1392, + 286, + 478, + 7159, + 300, + 2618, + 3690, + 337, + 385 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + 
"compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.792, + "words": [ + { + "text": "Look,", + "start": 137.66, + "end": 138.46, + "confidence": 0.849 + }, + { + "text": "okay", + "start": 138.46, + "end": 138.6, + "confidence": 0.646 + }, + { + "text": "I'm", + "start": 138.6, + "end": 138.86, + "confidence": 0.658 + }, + { + "text": "hoping", + "start": 138.86, + "end": 139.12, + "confidence": 0.576 + }, + { + "text": "that", + "start": 139.12, + "end": 139.32, + "confidence": 0.958 + }, + { + "text": "somebody", + "start": 139.32, + "end": 139.52, + "confidence": 0.975 + }, + { + "text": "pray", + "start": 139.52, + "end": 139.8, + "confidence": 0.85 + }, + { + "text": "for", + "start": 139.8, + "end": 140.02, + "confidence": 0.899 + }, + { + "text": "me", + "start": 140.02, + "end": 140.18, + "confidence": 0.999 + } + ] + }, + { + "id": 18, + "seek": 12018, + "start": 140.38, + "end": 141.64, + "text": " I'm praying that somebody vote for me", + "tokens": [ + 286, + 478, + 15611, + 300, + 2618, + 4740, + 337, + 385 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.821, + "words": [ + { + "text": "I'm", + "start": 140.38, + "end": 140.58, + "confidence": 0.756 + }, + { + "text": "praying", + "start": 140.58, + "end": 140.62, + "confidence": 0.956 + }, + { + "text": "that", + "start": 140.62, + "end": 140.82, + "confidence": 0.959 + }, + { + "text": "somebody", + "start": 140.82, + "end": 141.06, + "confidence": 0.995 + }, + { + "text": "vote", + "start": 141.06, + "end": 141.32, + "confidence": 0.396 + }, + { + "text": "for", + "start": 141.32, + "end": 141.52, + "confidence": 0.999 + }, + { + "text": "me", + "start": 141.52, + "end": 141.64, + "confidence": 1.0 + } + ] + }, + { + "id": 19, + "seek": 12018, + "start": 141.72, + "end": 143.2, + "text": " I'm staying where nobody's supposed to be", + 
"tokens": [ + 286, + 478, + 7939, + 689, + 5079, + 311, + 3442, + 281, + 312 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.893, + "words": [ + { + "text": "I'm", + "start": 141.72, + "end": 141.9, + "confidence": 0.937 + }, + { + "text": "staying", + "start": 141.9, + "end": 142.12, + "confidence": 0.82 + }, + { + "text": "where", + "start": 142.12, + "end": 142.3, + "confidence": 0.976 + }, + { + "text": "nobody's", + "start": 142.3, + "end": 142.88, + "confidence": 0.735 + }, + { + "text": "supposed", + "start": 142.88, + "end": 142.92, + "confidence": 0.957 + }, + { + "text": "to", + "start": 142.92, + "end": 143.12, + "confidence": 0.998 + }, + { + "text": "be", + "start": 143.12, + "end": 143.2, + "confidence": 0.999 + } + ] + }, + { + "id": 20, + "seek": 12018, + "start": 143.2, + "end": 144.86, + "text": " I propose to be in a rink of emotions", + "tokens": [ + 286, + 17421, + 281, + 312, + 294, + 257, + 367, + 475, + 295, + 8462 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.554, + "words": [ + { + "text": "I", + "start": 143.2, + "end": 143.36, + "confidence": 0.354 + }, + { + "text": "propose", + "start": 143.36, + "end": 143.64, + "confidence": 0.323 + }, + { + "text": "to", + "start": 143.64, + "end": 143.86, + "confidence": 0.856 + }, + { + "text": "be", + "start": 143.86, + "end": 144.04, + "confidence": 0.579 + }, + { + "text": "in", + "start": 144.04, + "end": 144.18, + "confidence": 0.837 + }, + { + "text": "a", + "start": 144.18, + "end": 144.24, + "confidence": 0.631 + }, + { + "text": "rink", + "start": 144.24, + "end": 144.42, + "confidence": 0.309 + }, + { + "text": "of", + "start": 144.42, + "end": 144.54, + "confidence": 0.996 + }, + { + "text": "emotions", + "start": 144.54, + "end": 144.86, + 
"confidence": 0.952 + } + ] + }, + { + "id": 21, + "seek": 12018, + "start": 145.06, + "end": 146.28, + "text": " Ready to go whenever you let me know", + "tokens": [ + 9944, + 281, + 352, + 5699, + 291, + 718, + 385, + 458 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.902, + "words": [ + { + "text": "Ready", + "start": 145.06, + "end": 145.26, + "confidence": 0.938 + }, + { + "text": "to", + "start": 145.26, + "end": 145.5, + "confidence": 0.997 + }, + { + "text": "go", + "start": 145.5, + "end": 145.58, + "confidence": 0.996 + }, + { + "text": "whenever", + "start": 145.58, + "end": 145.74, + "confidence": 0.85 + }, + { + "text": "you", + "start": 145.74, + "end": 145.92, + "confidence": 0.575 + }, + { + "text": "let", + "start": 145.92, + "end": 146.04, + "confidence": 0.97 + }, + { + "text": "me", + "start": 146.04, + "end": 146.16, + "confidence": 0.998 + }, + { + "text": "know", + "start": 146.16, + "end": 146.28, + "confidence": 0.992 + } + ] + }, + { + "id": 22, + "seek": 12018, + "start": 146.28, + "end": 147.84, + "text": " The road is long so put the pedal into the flow", + "tokens": [ + 440, + 3060, + 307, + 938, + 370, + 829, + 264, + 19122, + 666, + 264, + 3095 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.944, + "words": [ + { + "text": "The", + "start": 146.28, + "end": 146.5, + "confidence": 0.977 + }, + { + "text": "road", + "start": 146.5, + "end": 146.64, + "confidence": 0.989 + }, + { + "text": "is", + "start": 146.64, + "end": 146.74, + "confidence": 0.977 + }, + { + "text": "long", + "start": 146.74, + "end": 146.9, + "confidence": 0.936 + }, + { + "text": "so", + "start": 146.9, + "end": 147.04, + "confidence": 0.811 + }, + { + "text": "put", + "start": 147.04, + "end": 147.16, + "confidence": 0.94 + }, + 
{ + "text": "the", + "start": 147.16, + "end": 147.3, + "confidence": 0.969 + }, + { + "text": "pedal", + "start": 147.3, + "end": 147.4, + "confidence": 0.947 + }, + { + "text": "into", + "start": 147.4, + "end": 147.58, + "confidence": 0.955 + }, + { + "text": "the", + "start": 147.58, + "end": 147.76, + "confidence": 0.993 + }, + { + "text": "flow", + "start": 147.76, + "end": 147.84, + "confidence": 0.902 + } + ] + }, + { + "id": 23, + "seek": 12018, + "start": 147.96, + "end": 149.78, + "text": " The enemy on my trail, my energy unavailable", + "tokens": [ + 440, + 5945, + 322, + 452, + 9924, + 11, + 452, + 2281, + 36541, + 32699 + ], + "temperature": 0.4, + "avg_logprob": -0.3580510299817651, + "compression_ratio": 1.7621145374449338, + "no_speech_prob": 0.8322692513465881, + "confidence": 0.866, + "words": [ + { + "text": "The", + "start": 147.96, + "end": 148.08, + "confidence": 0.714 + }, + { + "text": "enemy", + "start": 148.08, + "end": 148.24, + "confidence": 0.473 + }, + { + "text": "on", + "start": 148.24, + "end": 148.44, + "confidence": 0.969 + }, + { + "text": "my", + "start": 148.44, + "end": 148.54, + "confidence": 0.977 + }, + { + "text": "trail,", + "start": 148.54, + "end": 148.76, + "confidence": 0.993 + }, + { + "text": "my", + "start": 148.76, + "end": 148.8, + "confidence": 0.988 + }, + { + "text": "energy", + "start": 148.8, + "end": 149.06, + "confidence": 0.993 + }, + { + "text": "unavailable", + "start": 149.06, + "end": 149.78, + "confidence": 0.935 + } + ] + }, + { + "id": 24, + "seek": 14968, + "start": 150.0, + "end": 151.16, + "text": " I'm a tell a monster the way go", + "tokens": [ + 286, + 478, + 257, + 980, + 257, + 10090, + 264, + 636, + 352 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.443, + "words": [ + { + "text": "I'm", + "start": 150.0, + "end": 150.18, + "confidence": 0.73 + }, + { + "text": "a", + 
"start": 150.18, + "end": 150.28, + "confidence": 0.203 + }, + { + "text": "tell", + "start": 150.28, + "end": 150.34, + "confidence": 0.507 + }, + { + "text": "a", + "start": 150.34, + "end": 150.46, + "confidence": 0.137 + }, + { + "text": "monster", + "start": 150.46, + "end": 150.66, + "confidence": 0.238 + }, + { + "text": "the", + "start": 150.66, + "end": 150.9, + "confidence": 0.585 + }, + { + "text": "way", + "start": 150.9, + "end": 150.98, + "confidence": 0.953 + }, + { + "text": "go", + "start": 150.98, + "end": 151.16, + "confidence": 0.664 + } + ] + }, + { + "id": 25, + "seek": 14968, + "start": 151.2, + "end": 152.54, + "text": " Way when the plot on my track to the top", + "tokens": [ + 9558, + 562, + 264, + 7542, + 322, + 452, + 2837, + 281, + 264, + 1192 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.517, + "words": [ + { + "text": "Way", + "start": 151.2, + "end": 151.38, + "confidence": 0.102 + }, + { + "text": "when", + "start": 151.38, + "end": 151.54, + "confidence": 0.434 + }, + { + "text": "the", + "start": 151.54, + "end": 151.66, + "confidence": 0.263 + }, + { + "text": "plot", + "start": 151.66, + "end": 151.78, + "confidence": 0.627 + }, + { + "text": "on", + "start": 151.78, + "end": 151.92, + "confidence": 0.605 + }, + { + "text": "my", + "start": 151.92, + "end": 152.0, + "confidence": 0.975 + }, + { + "text": "track", + "start": 152.0, + "end": 152.14, + "confidence": 0.338 + }, + { + "text": "to", + "start": 152.14, + "end": 152.32, + "confidence": 0.946 + }, + { + "text": "the", + "start": 152.32, + "end": 152.4, + "confidence": 0.991 + }, + { + "text": "top", + "start": 152.4, + "end": 152.54, + "confidence": 0.993 + } + ] + }, + { + "id": 26, + "seek": 14968, + "start": 152.54, + "end": 154.32, + "text": " I been out of shape thinking that I'm a box I'm an astronaut", + "tokens": [ + 286, + 668, + 484, + 295, + 
3909, + 1953, + 300, + 286, + 478, + 257, + 2424, + 286, + 478, + 364, + 18516 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.667, + "words": [ + { + "text": "I", + "start": 152.54, + "end": 152.7, + "confidence": 0.972 + }, + { + "text": "been", + "start": 152.7, + "end": 152.76, + "confidence": 0.691 + }, + { + "text": "out", + "start": 152.76, + "end": 152.9, + "confidence": 0.72 + }, + { + "text": "of", + "start": 152.9, + "end": 153.0, + "confidence": 0.959 + }, + { + "text": "shape", + "start": 153.0, + "end": 153.1, + "confidence": 0.998 + }, + { + "text": "thinking", + "start": 153.1, + "end": 153.3, + "confidence": 0.385 + }, + { + "text": "that", + "start": 153.3, + "end": 153.5, + "confidence": 0.353 + }, + { + "text": "I'm", + "start": 153.5, + "end": 153.66, + "confidence": 0.572 + }, + { + "text": "a", + "start": 153.66, + "end": 153.7, + "confidence": 0.703 + }, + { + "text": "box", + "start": 153.7, + "end": 153.74, + "confidence": 0.874 + }, + { + "text": "I'm", + "start": 153.74, + "end": 153.92, + "confidence": 0.451 + }, + { + "text": "an", + "start": 153.92, + "end": 153.96, + "confidence": 0.976 + }, + { + "text": "astronaut", + "start": 153.96, + "end": 154.32, + "confidence": 0.926 + } + ] + }, + { + "id": 27, + "seek": 14968, + "start": 154.52, + "end": 156.34, + "text": " Blast it off the planet rock the cause catastrophe", + "tokens": [ + 2177, + 525, + 309, + 766, + 264, + 5054, + 3727, + 264, + 3082, + 36043 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.583, + "words": [ + { + "text": "Blast", + "start": 154.52, + "end": 154.76, + "confidence": 0.476 + }, + { + "text": "it", + "start": 154.76, + "end": 154.9, + "confidence": 0.954 + }, + { + "text": "off", + "start": 154.9, + "end": 155.02, + 
"confidence": 0.984 + }, + { + "text": "the", + "start": 155.02, + "end": 155.2, + "confidence": 0.956 + }, + { + "text": "planet", + "start": 155.2, + "end": 155.34, + "confidence": 0.99 + }, + { + "text": "rock", + "start": 155.34, + "end": 155.52, + "confidence": 0.24 + }, + { + "text": "the", + "start": 155.52, + "end": 155.68, + "confidence": 0.301 + }, + { + "text": "cause", + "start": 155.68, + "end": 155.88, + "confidence": 0.701 + }, + { + "text": "catastrophe", + "start": 155.88, + "end": 156.34, + "confidence": 0.444 + } + ] + }, + { + "id": 28, + "seek": 14968, + "start": 156.44, + "end": 158.08, + "text": " And it matters more because ahead and not ahead", + "tokens": [ + 400, + 309, + 7001, + 544, + 570, + 2286, + 293, + 406, + 2286 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.721, + "words": [ + { + "text": "And", + "start": 156.44, + "end": 156.64, + "confidence": 0.828 + }, + { + "text": "it", + "start": 156.64, + "end": 156.78, + "confidence": 0.715 + }, + { + "text": "matters", + "start": 156.78, + "end": 156.94, + "confidence": 0.994 + }, + { + "text": "more", + "start": 156.94, + "end": 157.16, + "confidence": 0.981 + }, + { + "text": "because", + "start": 157.16, + "end": 157.38, + "confidence": 0.909 + }, + { + "text": "ahead", + "start": 157.38, + "end": 157.64, + "confidence": 0.432 + }, + { + "text": "and", + "start": 157.64, + "end": 157.82, + "confidence": 0.616 + }, + { + "text": "not", + "start": 157.82, + "end": 157.94, + "confidence": 0.716 + }, + { + "text": "ahead", + "start": 157.94, + "end": 158.08, + "confidence": 0.524 + } + ] + }, + { + "id": 29, + "seek": 14968, + "start": 158.1, + "end": 159.74, + "text": " I thought about wreaking havoc on an opposition", + "tokens": [ + 286, + 1194, + 466, + 46674, + 2456, + 47367, + 322, + 364, + 13504 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + 
"compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.963, + "words": [ + { + "text": "I", + "start": 158.1, + "end": 158.24, + "confidence": 0.986 + }, + { + "text": "thought", + "start": 158.24, + "end": 158.36, + "confidence": 0.977 + }, + { + "text": "about", + "start": 158.36, + "end": 158.58, + "confidence": 0.975 + }, + { + "text": "wreaking", + "start": 158.58, + "end": 158.84, + "confidence": 0.944 + }, + { + "text": "havoc", + "start": 158.84, + "end": 159.08, + "confidence": 1.0 + }, + { + "text": "on", + "start": 159.08, + "end": 159.3, + "confidence": 0.944 + }, + { + "text": "an", + "start": 159.3, + "end": 159.44, + "confidence": 0.913 + }, + { + "text": "opposition", + "start": 159.44, + "end": 159.74, + "confidence": 0.987 + } + ] + }, + { + "id": 30, + "seek": 14968, + "start": 159.88, + "end": 161.52, + "text": " Kinda shockin' they want it static with precision", + "tokens": [ + 35553, + 5588, + 259, + 6, + 436, + 528, + 309, + 13437, + 365, + 18356 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.537, + "words": [ + { + "text": "Kinda", + "start": 159.88, + "end": 160.1, + "confidence": 0.574 + }, + { + "text": "shockin'", + "start": 160.1, + "end": 160.5, + "confidence": 0.408 + }, + { + "text": "they", + "start": 160.5, + "end": 160.58, + "confidence": 0.371 + }, + { + "text": "want", + "start": 160.58, + "end": 160.74, + "confidence": 0.454 + }, + { + "text": "it", + "start": 160.74, + "end": 160.84, + "confidence": 0.577 + }, + { + "text": "static", + "start": 160.84, + "end": 161.02, + "confidence": 0.993 + }, + { + "text": "with", + "start": 161.02, + "end": 161.22, + "confidence": 0.609 + }, + { + "text": "precision", + "start": 161.22, + "end": 161.52, + "confidence": 0.877 + } + ] + }, + { + "id": 31, + "seek": 14968, + "start": 161.62, + "end": 163.36, + "text": " I'm 
automatic quarterback I ain't talkin' second", + "tokens": [ + 286, + 478, + 12509, + 31952, + 286, + 7862, + 380, + 39243, + 6, + 1150 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.735, + "words": [ + { + "text": "I'm", + "start": 161.62, + "end": 161.78, + "confidence": 0.935 + }, + { + "text": "automatic", + "start": 161.78, + "end": 162.18, + "confidence": 0.975 + }, + { + "text": "quarterback", + "start": 162.18, + "end": 162.58, + "confidence": 0.419 + }, + { + "text": "I", + "start": 162.58, + "end": 162.8, + "confidence": 0.405 + }, + { + "text": "ain't", + "start": 162.8, + "end": 162.88, + "confidence": 0.968 + }, + { + "text": "talkin'", + "start": 162.88, + "end": 163.18, + "confidence": 0.783 + }, + { + "text": "second", + "start": 163.18, + "end": 163.36, + "confidence": 0.556 + } + ] + }, + { + "id": 32, + "seek": 14968, + "start": 163.4, + "end": 164.58, + "text": " Pack it pack it up I don't panic", + "tokens": [ + 18466, + 309, + 2844, + 309, + 493, + 286, + 500, + 380, + 14783 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.786, + "words": [ + { + "text": "Pack", + "start": 163.4, + "end": 163.6, + "confidence": 0.931 + }, + { + "text": "it", + "start": 163.6, + "end": 163.66, + "confidence": 0.88 + }, + { + "text": "pack", + "start": 163.66, + "end": 163.82, + "confidence": 0.298 + }, + { + "text": "it", + "start": 163.82, + "end": 164.04, + "confidence": 0.994 + }, + { + "text": "up", + "start": 164.04, + "end": 164.1, + "confidence": 0.977 + }, + { + "text": "I", + "start": 164.1, + "end": 164.2, + "confidence": 0.637 + }, + { + "text": "don't", + "start": 164.2, + "end": 164.54, + "confidence": 0.87 + }, + { + "text": "panic", + "start": 164.54, + "end": 164.58, + "confidence": 0.997 + } + ] + }, + { + "id": 
33, + "seek": 14968, + "start": 164.58, + "end": 165.7, + "text": " Better batter up who the baddest", + "tokens": [ + 15753, + 4220, + 493, + 567, + 264, + 1578, + 23748 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.703, + "words": [ + { + "text": "Better", + "start": 164.58, + "end": 164.82, + "confidence": 0.627 + }, + { + "text": "batter", + "start": 164.82, + "end": 165.1, + "confidence": 0.265 + }, + { + "text": "up", + "start": 165.1, + "end": 165.24, + "confidence": 0.963 + }, + { + "text": "who", + "start": 165.24, + "end": 165.4, + "confidence": 0.861 + }, + { + "text": "the", + "start": 165.4, + "end": 165.52, + "confidence": 0.973 + }, + { + "text": "baddest", + "start": 165.52, + "end": 165.7, + "confidence": 0.797 + } + ] + }, + { + "id": 34, + "seek": 14968, + "start": 165.7, + "end": 166.74, + "text": " It don't matter cause we it's your", + "tokens": [ + 467, + 500, + 380, + 1871, + 3082, + 321, + 309, + 311, + 428 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.727, + "words": [ + { + "text": "It", + "start": 165.7, + "end": 165.9, + "confidence": 0.979 + }, + { + "text": "don't", + "start": 165.9, + "end": 166.14, + "confidence": 0.995 + }, + { + "text": "matter", + "start": 166.14, + "end": 166.18, + "confidence": 0.998 + }, + { + "text": "cause", + "start": 166.18, + "end": 166.4, + "confidence": 0.588 + }, + { + "text": "we", + "start": 166.4, + "end": 166.52, + "confidence": 0.973 + }, + { + "text": "it's", + "start": 166.52, + "end": 166.7, + "confidence": 0.404 + }, + { + "text": "your", + "start": 166.7, + "end": 166.74, + "confidence": 0.632 + } + ] + }, + { + "id": 35, + "seek": 14968, + "start": 166.8, + "end": 169.52, + "text": " Everybody wants to be my enemy", + "tokens": [ + 7646, + 2738, + 281, + 
312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.966, + "words": [ + { + "text": "Everybody", + "start": 166.8, + "end": 167.34, + "confidence": 0.896 + }, + { + "text": "wants", + "start": 167.34, + "end": 167.74, + "confidence": 0.97 + }, + { + "text": "to", + "start": 167.74, + "end": 167.94, + "confidence": 0.996 + }, + { + "text": "be", + "start": 167.94, + "end": 168.14, + "confidence": 0.996 + }, + { + "text": "my", + "start": 168.14, + "end": 168.46, + "confidence": 0.991 + }, + { + "text": "enemy", + "start": 168.46, + "end": 169.52, + "confidence": 0.95 + } + ] + }, + { + "id": 36, + "seek": 14968, + "start": 170.66, + "end": 172.2, + "text": " Spare the sympathy", + "tokens": [ + 1738, + 543, + 264, + 33240 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.687, + "words": [ + { + "text": "Spare", + "start": 170.66, + "end": 171.22, + "confidence": 0.494 + }, + { + "text": "the", + "start": 171.22, + "end": 171.46, + "confidence": 0.976 + }, + { + "text": "sympathy", + "start": 171.46, + "end": 172.2, + "confidence": 0.937 + } + ] + }, + { + "id": 37, + "seek": 14968, + "start": 172.96, + "end": 176.18, + "text": " Everybody wants to be my enemy", + "tokens": [ + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.983, + "words": [ + { + "text": "Everybody", + "start": 172.96, + "end": 173.62, + "confidence": 0.994 + }, + { + "text": "wants", + "start": 173.62, + "end": 174.02, + "confidence": 0.99 + }, + { + "text": "to", + "start": 174.02, + "end": 174.36, + "confidence": 0.999 + }, + { + "text": "be", + "start": 174.36, + "end": 175.0, + "confidence": 
0.999 + }, + { + "text": "my", + "start": 175.0, + "end": 175.4, + "confidence": 0.924 + }, + { + "text": "enemy", + "start": 175.4, + "end": 176.18, + "confidence": 0.996 + } + ] + }, + { + "id": 38, + "seek": 14968, + "start": 176.84, + "end": 178.44, + "text": " Oh the misery", + "tokens": [ + 876, + 264, + 32309 + ], + "temperature": 0.4, + "avg_logprob": -0.5499832056745698, + "compression_ratio": 1.8025078369905956, + "no_speech_prob": 0.8352975249290466, + "confidence": 0.813, + "words": [ + { + "text": "Oh", + "start": 176.84, + "end": 177.48, + "confidence": 0.677 + }, + { + "text": "the", + "start": 177.48, + "end": 177.66, + "confidence": 0.794 + }, + { + "text": "misery", + "start": 177.66, + "end": 178.44, + "confidence": 0.998 + } + ] + }, + { + "id": 39, + "seek": 17906, + "start": 179.28, + "end": 181.44, + "text": " Everybody wants to be my enemy", + "tokens": [ + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.6545042613195995, + "compression_ratio": 1.97, + "no_speech_prob": 0.5597606301307678, + "confidence": 0.955, + "words": [ + { + "text": "Everybody", + "start": 179.28, + "end": 179.84, + "confidence": 0.802 + }, + { + "text": "wants", + "start": 179.84, + "end": 180.22, + "confidence": 0.984 + }, + { + "text": "to", + "start": 180.22, + "end": 180.44, + "confidence": 0.997 + }, + { + "text": "be", + "start": 180.44, + "end": 180.58, + "confidence": 0.998 + }, + { + "text": "my", + "start": 180.58, + "end": 180.86, + "confidence": 0.992 + }, + { + "text": "enemy", + "start": 180.86, + "end": 181.44, + "confidence": 0.976 + } + ] + }, + { + "id": 40, + "seek": 17906, + "start": 183.12, + "end": 184.52, + "text": " Spare the sympathy", + "tokens": [ + 1738, + 543, + 264, + 33240 + ], + "temperature": 0.4, + "avg_logprob": -0.6545042613195995, + "compression_ratio": 1.97, + "no_speech_prob": 0.5597606301307678, + "confidence": 0.678, + "words": [ + { + "text": "Spare", + "start": 183.12, + "end": 183.7, 
+ "confidence": 0.479 + }, + { + "text": "the", + "start": 183.7, + "end": 183.92, + "confidence": 0.934 + }, + { + "text": "sympathy", + "start": 183.92, + "end": 184.52, + "confidence": 0.986 + } + ] + }, + { + "id": 41, + "seek": 17906, + "start": 185.56, + "end": 188.46, + "text": " Everybody wants to be my enemy", + "tokens": [ + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.6545042613195995, + "compression_ratio": 1.97, + "no_speech_prob": 0.5597606301307678, + "confidence": 0.959, + "words": [ + { + "text": "Everybody", + "start": 185.56, + "end": 186.08, + "confidence": 0.993 + }, + { + "text": "wants", + "start": 186.08, + "end": 186.46, + "confidence": 0.99 + }, + { + "text": "to", + "start": 186.46, + "end": 186.72, + "confidence": 0.999 + }, + { + "text": "be", + "start": 186.72, + "end": 187.22, + "confidence": 0.999 + }, + { + "text": "my", + "start": 187.22, + "end": 187.86, + "confidence": 0.798 + }, + { + "text": "enemy", + "start": 187.86, + "end": 188.46, + "confidence": 0.991 + } + ] + }, + { + "id": 42, + "seek": 17906, + "start": 190.1, + "end": 191.96, + "text": " I swear, I swear I'll never be a saint", + "tokens": [ + 286, + 11902, + 11, + 286, + 11902, + 286, + 603, + 1128, + 312, + 257, + 28374 + ], + "temperature": 0.4, + "avg_logprob": -0.6545042613195995, + "compression_ratio": 1.97, + "no_speech_prob": 0.5597606301307678, + "confidence": 0.662, + "words": [ + { + "text": "I", + "start": 190.1, + "end": 190.14, + "confidence": 0.107 + }, + { + "text": "swear,", + "start": 190.14, + "end": 190.44, + "confidence": 0.908 + }, + { + "text": "I", + "start": 190.44, + "end": 190.48, + "confidence": 0.962 + }, + { + "text": "swear", + "start": 190.48, + "end": 190.52, + "confidence": 0.867 + }, + { + "text": "I'll", + "start": 190.52, + "end": 191.24, + "confidence": 0.628 + }, + { + "text": "never", + "start": 191.24, + "end": 191.28, + "confidence": 0.987 + }, + { + "text": "be", + "start": 191.28, 
+ "end": 191.56, + "confidence": 0.993 + }, + { + "text": "a", + "start": 191.56, + "end": 191.76, + "confidence": 0.602 + }, + { + "text": "saint", + "start": 191.76, + "end": 191.96, + "confidence": 0.858 + } + ] + }, + { + "id": 43, + "seek": 17906, + "start": 192.12, + "end": 194.66, + "text": " I swear, my enemy", + "tokens": [ + 286, + 11902, + 11, + 452, + 5945 + ], + "temperature": 0.4, + "avg_logprob": -0.6545042613195995, + "compression_ratio": 1.97, + "no_speech_prob": 0.5597606301307678, + "confidence": 0.529, + "words": [ + { + "text": "I", + "start": 192.12, + "end": 192.62, + "confidence": 0.35 + }, + { + "text": "swear,", + "start": 192.62, + "end": 193.88, + "confidence": 0.83 + }, + { + "text": "my", + "start": 193.88, + "end": 194.02, + "confidence": 0.279 + }, + { + "text": "enemy", + "start": 194.02, + "end": 194.66, + "confidence": 0.964 + } + ] + }, + { + "id": 44, + "seek": 17906, + "start": 196.34, + "end": 198.36, + "text": " I swear, I swear I'll never be a saint", + "tokens": [ + 286, + 11902, + 11, + 286, + 11902, + 286, + 603, + 1128, + 312, + 257, + 28374 + ], + "temperature": 0.4, + "avg_logprob": -0.6545042613195995, + "compression_ratio": 1.97, + "no_speech_prob": 0.5597606301307678, + "confidence": 0.976, + "words": [ + { + "text": "I", + "start": 196.34, + "end": 196.38, + "confidence": 0.945 + }, + { + "text": "swear,", + "start": 196.38, + "end": 196.56, + "confidence": 0.999 + }, + { + "text": "I", + "start": 196.56, + "end": 196.6, + "confidence": 0.875 + }, + { + "text": "swear", + "start": 196.6, + "end": 196.84, + "confidence": 0.995 + }, + { + "text": "I'll", + "start": 196.84, + "end": 197.36, + "confidence": 0.982 + }, + { + "text": "never", + "start": 197.36, + "end": 197.5, + "confidence": 0.999 + }, + { + "text": "be", + "start": 197.5, + "end": 197.8, + "confidence": 0.999 + }, + { + "text": "a", + "start": 197.8, + "end": 198.04, + "confidence": 0.997 + }, + { + "text": "saint", + "start": 198.04, + "end": 198.36, 
+ "confidence": 0.994 + } + ] + }, + { + "id": 45, + "seek": 19822, + "start": 198.44, + "end": 200.22, + "text": " You got to be yourself!", + "tokens": [ + 50364, + 509, + 658, + 281, + 312, + 1803, + 0, + 50464 + ], + "temperature": 0.4, + "avg_logprob": -0.8683164384629991, + "compression_ratio": 0.7419354838709677, + "no_speech_prob": 0.6954998970031738, + "confidence": 0.365, + "words": [ + { + "text": "You", + "start": 198.44, + "end": 198.62, + "confidence": 0.054 + }, + { + "text": "got", + "start": 198.62, + "end": 198.8, + "confidence": 0.163 + }, + { + "text": "to", + "start": 198.8, + "end": 198.98, + "confidence": 0.918 + }, + { + "text": "be", + "start": 198.98, + "end": 199.06, + "confidence": 0.87 + }, + { + "text": "yourself!", + "start": 199.06, + "end": 200.22, + "confidence": 0.913 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases.cpu/nocond_music.mp4.words.json b/tests/expected/corner_cases.cpu/nocond_music.mp4.words.json new file mode 100644 index 0000000000000000000000000000000000000000..ddd3ddeb2eb18ea98bb99dffe65159d92a046d85 --- /dev/null +++ b/tests/expected/corner_cases.cpu/nocond_music.mp4.words.json @@ -0,0 +1,2687 @@ +{ + "text": " I Oh, the misery Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy Look out for yourself My enemy Look out for yourself But I'm ready Your words up on the wall as you're praying for my phone And the laughter in the holes and the names that I've been called I stack it in my mind and I'm waiting for the time When I show you what it's like to be worse but in the mind Tell you you're the greatest But once you turn they hate us Oh, the misery Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy Look out for yourself My enemy Look out for yourself Look, okay I'm hoping that somebody pray for me I'm praying that somebody hold for me. I'm staying where nobody's supposed to be. 
I propose to be in a wreck of emotions. Ready to go whenever you let me know. The road is long, so put the pedal into the flow. The enemy on my trail, my energy unavailable. I'ma tell them I said away, go away. When I'm plotting, I'ma drive to the top. I've been out of shape, thinking out of the box. I'm an astronaut, blasted off the planet. Rock the cars, catastrophic, and it matters more because I had it now. Had I thought about wreaking havoc on an opposition. Kind of shocking, they want it static. With precision, I'm automatic. Quarterback, I ain't talking second. Pack it, pack it up. I don't panic, better, better. Up who the baddest. it don't matter cause we is your enemy. I swear I'll never be insane You got to be yourself", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.02, + "end": 0.4, + "text": " I", + "tokens": [ + 50364, + 286, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.9367842674255371, + "compression_ratio": 0.1111111111111111, + "no_speech_prob": 0.7794302701950073, + "confidence": 0.032, + "words": [ + { + "text": "I", + "start": 0.02, + "end": 0.4, + "confidence": 0.032 + } + ] + }, + { + "id": 1, + "seek": 6000, + "start": 60.02, + "end": 69.26, + "text": " Oh, the misery Everybody wants to be my enemy", + "tokens": [ + 876, + 11, + 264, + 32309, + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.0, + "avg_logprob": -0.45698386972600763, + "compression_ratio": 1.62, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.669, + "words": [ + { + "text": "Oh,", + "start": 60.02, + "end": 65.44, + "confidence": 0.084 + }, + { + "text": "the", + "start": 65.44, + "end": 65.48, + "confidence": 0.796 + }, + { + "text": "misery", + "start": 65.48, + "end": 66.08, + "confidence": 0.993 + }, + { + "text": "Everybody", + "start": 66.08, + "end": 67.62, + "confidence": 0.431 + }, + { + "text": "wants", + "start": 67.62, + "end": 68.0, + "confidence": 0.983 + }, + { + "text": "to", + "start": 68.0, + "end": 68.2, + 
"confidence": 0.993 + }, + { + "text": "be", + "start": 68.2, + "end": 68.4, + "confidence": 0.996 + }, + { + "text": "my", + "start": 68.4, + "end": 68.74, + "confidence": 0.984 + }, + { + "text": "enemy", + "start": 68.74, + "end": 69.26, + "confidence": 0.984 + } + ] + }, + { + "id": 2, + "seek": 6000, + "start": 70.9, + "end": 76.38, + "text": " Spare the sympathy Everybody wants to be my enemy", + "tokens": [ + 1738, + 543, + 264, + 33240, + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.0, + "avg_logprob": -0.45698386972600763, + "compression_ratio": 1.62, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.934, + "words": [ + { + "text": "Spare", + "start": 70.9, + "end": 71.4, + "confidence": 0.812 + }, + { + "text": "the", + "start": 71.4, + "end": 71.74, + "confidence": 0.968 + }, + { + "text": "sympathy", + "start": 71.74, + "end": 72.58, + "confidence": 0.993 + }, + { + "text": "Everybody", + "start": 72.58, + "end": 73.88, + "confidence": 0.962 + }, + { + "text": "wants", + "start": 73.88, + "end": 74.24, + "confidence": 0.994 + }, + { + "text": "to", + "start": 74.24, + "end": 74.42, + "confidence": 0.999 + }, + { + "text": "be", + "start": 74.42, + "end": 75.36, + "confidence": 0.999 + }, + { + "text": "my", + "start": 75.36, + "end": 75.68, + "confidence": 0.837 + }, + { + "text": "enemy", + "start": 75.68, + "end": 76.38, + "confidence": 0.997 + } + ] + }, + { + "id": 3, + "seek": 6000, + "start": 79.94, + "end": 82.58, + "text": " Look out for yourself My enemy", + "tokens": [ + 2053, + 484, + 337, + 1803, + 1222, + 5945 + ], + "temperature": 0.0, + "avg_logprob": -0.45698386972600763, + "compression_ratio": 1.62, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.774, + "words": [ + { + "text": "Look", + "start": 79.94, + "end": 80.14, + "confidence": 0.43 + }, + { + "text": "out", + "start": 80.14, + "end": 80.46, + "confidence": 0.991 + }, + { + "text": "for", + "start": 80.46, + "end": 80.6, + "confidence": 
0.989 + }, + { + "text": "yourself", + "start": 80.6, + "end": 81.24, + "confidence": 0.97 + }, + { + "text": "My", + "start": 81.24, + "end": 81.88, + "confidence": 0.536 + }, + { + "text": "enemy", + "start": 81.88, + "end": 82.58, + "confidence": 0.98 + } + ] + }, + { + "id": 4, + "seek": 6000, + "start": 86.18, + "end": 88.46, + "text": " Look out for yourself But I'm ready", + "tokens": [ + 2053, + 484, + 337, + 1803, + 583, + 286, + 478, + 1919 + ], + "temperature": 0.0, + "avg_logprob": -0.45698386972600763, + "compression_ratio": 1.62, + "no_speech_prob": 0.8689420819282532, + "confidence": 0.927, + "words": [ + { + "text": "Look", + "start": 86.18, + "end": 86.4, + "confidence": 0.747 + }, + { + "text": "out", + "start": 86.4, + "end": 86.64, + "confidence": 0.988 + }, + { + "text": "for", + "start": 86.64, + "end": 86.82, + "confidence": 0.998 + }, + { + "text": "yourself", + "start": 86.82, + "end": 87.62, + "confidence": 0.999 + }, + { + "text": "But", + "start": 87.62, + "end": 87.88, + "confidence": 0.764 + }, + { + "text": "I'm", + "start": 87.88, + "end": 88.12, + "confidence": 0.989 + }, + { + "text": "ready", + "start": 88.12, + "end": 88.46, + "confidence": 0.995 + } + ] + }, + { + "id": 5, + "seek": 8856, + "start": 88.58, + "end": 91.58, + "text": " Your words up on the wall as you're praying for my phone", + "tokens": [ + 2260, + 2283, + 493, + 322, + 264, + 2929, + 382, + 291, + 434, + 15611, + 337, + 452, + 2593 + ], + "temperature": 0.0, + "avg_logprob": -0.2876515737394007, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7907973527908325, + "confidence": 0.82, + "words": [ + { + "text": "Your", + "start": 88.58, + "end": 88.86, + "confidence": 0.549 + }, + { + "text": "words", + "start": 88.86, + "end": 89.12, + "confidence": 0.921 + }, + { + "text": "up", + "start": 89.12, + "end": 89.46, + "confidence": 0.965 + }, + { + "text": "on", + "start": 89.46, + "end": 89.6, + "confidence": 0.995 + }, + { + "text": "the", + 
"start": 89.6, + "end": 89.66, + "confidence": 0.991 + }, + { + "text": "wall", + "start": 89.66, + "end": 90.12, + "confidence": 0.88 + }, + { + "text": "as", + "start": 90.12, + "end": 90.34, + "confidence": 0.403 + }, + { + "text": "you're", + "start": 90.34, + "end": 90.8, + "confidence": 0.828 + }, + { + "text": "praying", + "start": 90.8, + "end": 90.84, + "confidence": 0.967 + }, + { + "text": "for", + "start": 90.84, + "end": 91.06, + "confidence": 0.97 + }, + { + "text": "my", + "start": 91.06, + "end": 91.24, + "confidence": 0.989 + }, + { + "text": "phone", + "start": 91.24, + "end": 91.58, + "confidence": 0.702 + } + ] + }, + { + "id": 6, + "seek": 8856, + "start": 91.78, + "end": 94.68, + "text": " And the laughter in the holes and the names that I've been called", + "tokens": [ + 400, + 264, + 13092, + 294, + 264, + 8118, + 293, + 264, + 5288, + 300, + 286, + 600, + 668, + 1219 + ], + "temperature": 0.0, + "avg_logprob": -0.2876515737394007, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7907973527908325, + "confidence": 0.885, + "words": [ + { + "text": "And", + "start": 91.78, + "end": 91.92, + "confidence": 0.844 + }, + { + "text": "the", + "start": 91.92, + "end": 92.0, + "confidence": 0.987 + }, + { + "text": "laughter", + "start": 92.0, + "end": 92.4, + "confidence": 0.994 + }, + { + "text": "in", + "start": 92.4, + "end": 92.72, + "confidence": 0.849 + }, + { + "text": "the", + "start": 92.72, + "end": 92.92, + "confidence": 0.997 + }, + { + "text": "holes", + "start": 92.92, + "end": 93.2, + "confidence": 0.609 + }, + { + "text": "and", + "start": 93.2, + "end": 93.44, + "confidence": 0.596 + }, + { + "text": "the", + "start": 93.44, + "end": 93.54, + "confidence": 0.991 + }, + { + "text": "names", + "start": 93.54, + "end": 93.82, + "confidence": 0.991 + }, + { + "text": "that", + "start": 93.82, + "end": 94.12, + "confidence": 0.957 + }, + { + "text": "I've", + "start": 94.12, + "end": 94.28, + "confidence": 0.915 + }, + { 
+ "text": "been", + "start": 94.28, + "end": 94.42, + "confidence": 0.986 + }, + { + "text": "called", + "start": 94.42, + "end": 94.68, + "confidence": 0.912 + } + ] + }, + { + "id": 7, + "seek": 8856, + "start": 95.0, + "end": 97.82, + "text": " I stack it in my mind and I'm waiting for the time", + "tokens": [ + 286, + 8630, + 309, + 294, + 452, + 1575, + 293, + 286, + 478, + 3806, + 337, + 264, + 565 + ], + "temperature": 0.0, + "avg_logprob": -0.2876515737394007, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7907973527908325, + "confidence": 0.96, + "words": [ + { + "text": "I", + "start": 95.0, + "end": 95.12, + "confidence": 0.987 + }, + { + "text": "stack", + "start": 95.12, + "end": 95.42, + "confidence": 0.825 + }, + { + "text": "it", + "start": 95.42, + "end": 95.7, + "confidence": 0.995 + }, + { + "text": "in", + "start": 95.7, + "end": 95.82, + "confidence": 0.996 + }, + { + "text": "my", + "start": 95.82, + "end": 96.02, + "confidence": 0.994 + }, + { + "text": "mind", + "start": 96.02, + "end": 96.4, + "confidence": 0.999 + }, + { + "text": "and", + "start": 96.4, + "end": 96.62, + "confidence": 0.762 + }, + { + "text": "I'm", + "start": 96.62, + "end": 97.02, + "confidence": 0.991 + }, + { + "text": "waiting", + "start": 97.02, + "end": 97.06, + "confidence": 0.988 + }, + { + "text": "for", + "start": 97.06, + "end": 97.32, + "confidence": 0.996 + }, + { + "text": "the", + "start": 97.32, + "end": 97.5, + "confidence": 0.996 + }, + { + "text": "time", + "start": 97.5, + "end": 97.82, + "confidence": 0.996 + } + ] + }, + { + "id": 8, + "seek": 8856, + "start": 97.98, + "end": 101.24, + "text": " When I show you what it's like to be worse but in the mind", + "tokens": [ + 1133, + 286, + 855, + 291, + 437, + 309, + 311, + 411, + 281, + 312, + 5324, + 457, + 294, + 264, + 1575 + ], + "temperature": 0.0, + "avg_logprob": -0.2876515737394007, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7907973527908325, + 
"confidence": 0.755, + "words": [ + { + "text": "When", + "start": 97.98, + "end": 98.16, + "confidence": 0.923 + }, + { + "text": "I", + "start": 98.16, + "end": 98.22, + "confidence": 0.993 + }, + { + "text": "show", + "start": 98.22, + "end": 98.48, + "confidence": 0.959 + }, + { + "text": "you", + "start": 98.48, + "end": 98.74, + "confidence": 0.994 + }, + { + "text": "what", + "start": 98.74, + "end": 98.96, + "confidence": 0.996 + }, + { + "text": "it's", + "start": 98.96, + "end": 99.38, + "confidence": 0.988 + }, + { + "text": "like", + "start": 99.38, + "end": 99.42, + "confidence": 0.998 + }, + { + "text": "to", + "start": 99.42, + "end": 99.68, + "confidence": 0.877 + }, + { + "text": "be", + "start": 99.68, + "end": 99.78, + "confidence": 0.997 + }, + { + "text": "worse", + "start": 99.78, + "end": 100.04, + "confidence": 0.444 + }, + { + "text": "but", + "start": 100.04, + "end": 100.36, + "confidence": 0.196 + }, + { + "text": "in", + "start": 100.36, + "end": 100.52, + "confidence": 0.862 + }, + { + "text": "the", + "start": 100.52, + "end": 100.8, + "confidence": 0.426 + }, + { + "text": "mind", + "start": 100.8, + "end": 101.24, + "confidence": 0.621 + } + ] + }, + { + "id": 9, + "seek": 8856, + "start": 101.32, + "end": 106.28, + "text": " Tell you you're the greatest", + "tokens": [ + 5115, + 291, + 291, + 434, + 264, + 6636 + ], + "temperature": 0.0, + "avg_logprob": -0.2876515737394007, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7907973527908325, + "confidence": 0.94, + "words": [ + { + "text": "Tell", + "start": 101.32, + "end": 102.08, + "confidence": 0.937 + }, + { + "text": "you", + "start": 102.08, + "end": 102.68, + "confidence": 0.993 + }, + { + "text": "you're", + "start": 102.68, + "end": 103.66, + "confidence": 0.873 + }, + { + "text": "the", + "start": 103.66, + "end": 104.14, + "confidence": 0.985 + }, + { + "text": "greatest", + "start": 104.14, + "end": 106.28, + "confidence": 0.986 + } + ] + }, + { + "id": 
10, + "seek": 8856, + "start": 107.18, + "end": 113.0, + "text": " But once you turn they hate us", + "tokens": [ + 583, + 1564, + 291, + 1261, + 436, + 4700, + 505 + ], + "temperature": 0.0, + "avg_logprob": -0.2876515737394007, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7907973527908325, + "confidence": 0.909, + "words": [ + { + "text": "But", + "start": 107.18, + "end": 107.52, + "confidence": 0.963 + }, + { + "text": "once", + "start": 107.52, + "end": 108.34, + "confidence": 0.79 + }, + { + "text": "you", + "start": 108.34, + "end": 108.9, + "confidence": 0.998 + }, + { + "text": "turn", + "start": 108.9, + "end": 109.84, + "confidence": 0.913 + }, + { + "text": "they", + "start": 109.84, + "end": 110.34, + "confidence": 0.754 + }, + { + "text": "hate", + "start": 110.34, + "end": 111.9, + "confidence": 0.985 + }, + { + "text": "us", + "start": 111.9, + "end": 113.0, + "confidence": 0.999 + } + ] + }, + { + "id": 11, + "seek": 11312, + "start": 113.14, + "end": 119.18, + "text": " Oh, the misery Everybody wants to be my enemy", + "tokens": [ + 876, + 11, + 264, + 32309, + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.0, + "avg_logprob": -0.2736021077857827, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.8637643456459045, + "confidence": 0.804, + "words": [ + { + "text": "Oh,", + "start": 113.14, + "end": 115.14, + "confidence": 0.317 + }, + { + "text": "the", + "start": 115.14, + "end": 115.34, + "confidence": 0.964 + }, + { + "text": "misery", + "start": 115.34, + "end": 116.08, + "confidence": 0.995 + }, + { + "text": "Everybody", + "start": 116.08, + "end": 117.48, + "confidence": 0.482 + }, + { + "text": "wants", + "start": 117.48, + "end": 117.86, + "confidence": 0.986 + }, + { + "text": "to", + "start": 117.86, + "end": 118.08, + "confidence": 0.995 + }, + { + "text": "be", + "start": 118.08, + "end": 118.26, + "confidence": 0.998 + }, + { + "text": "my", + "start": 118.26, + "end": 118.58, + 
"confidence": 0.993 + }, + { + "text": "enemy", + "start": 118.58, + "end": 119.18, + "confidence": 0.983 + } + ] + }, + { + "id": 12, + "seek": 11312, + "start": 119.94, + "end": 126.08, + "text": " Spare the sympathy Everybody wants to be my enemy", + "tokens": [ + 1738, + 543, + 264, + 33240, + 7646, + 2738, + 281, + 312, + 452, + 5945 + ], + "temperature": 0.0, + "avg_logprob": -0.2736021077857827, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.8637643456459045, + "confidence": 0.874, + "words": [ + { + "text": "Spare", + "start": 119.94, + "end": 121.26, + "confidence": 0.576 + }, + { + "text": "the", + "start": 121.26, + "end": 121.62, + "confidence": 0.985 + }, + { + "text": "sympathy", + "start": 121.62, + "end": 122.32, + "confidence": 0.994 + }, + { + "text": "Everybody", + "start": 122.32, + "end": 123.76, + "confidence": 0.969 + }, + { + "text": "wants", + "start": 123.76, + "end": 124.12, + "confidence": 0.994 + }, + { + "text": "to", + "start": 124.12, + "end": 124.6, + "confidence": 0.999 + }, + { + "text": "be", + "start": 124.6, + "end": 125.34, + "confidence": 0.999 + }, + { + "text": "my", + "start": 125.34, + "end": 125.58, + "confidence": 0.835 + }, + { + "text": "enemy", + "start": 125.58, + "end": 126.08, + "confidence": 0.998 + } + ] + }, + { + "id": 13, + "seek": 11312, + "start": 129.86, + "end": 132.32, + "text": " Look out for yourself My enemy", + "tokens": [ + 2053, + 484, + 337, + 1803, + 1222, + 5945 + ], + "temperature": 0.0, + "avg_logprob": -0.2736021077857827, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.8637643456459045, + "confidence": 0.794, + "words": [ + { + "text": "Look", + "start": 129.86, + "end": 130.08, + "confidence": 0.592 + }, + { + "text": "out", + "start": 130.08, + "end": 130.3, + "confidence": 0.892 + }, + { + "text": "for", + "start": 130.3, + "end": 130.44, + "confidence": 0.978 + }, + { + "text": "yourself", + "start": 130.44, + "end": 130.92, + "confidence": 0.988 + }, + 
{ + "text": "My", + "start": 130.92, + "end": 131.74, + "confidence": 0.496 + }, + { + "text": "enemy", + "start": 131.74, + "end": 132.32, + "confidence": 0.989 + } + ] + }, + { + "id": 14, + "seek": 11312, + "start": 133.7, + "end": 137.14, + "text": " Look out for yourself", + "tokens": [ + 2053, + 484, + 337, + 1803 + ], + "temperature": 0.0, + "avg_logprob": -0.2736021077857827, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.8637643456459045, + "confidence": 0.97, + "words": [ + { + "text": "Look", + "start": 133.7, + "end": 134.62, + "confidence": 0.907 + }, + { + "text": "out", + "start": 134.62, + "end": 136.52, + "confidence": 0.978 + }, + { + "text": "for", + "start": 136.52, + "end": 136.66, + "confidence": 0.999 + }, + { + "text": "yourself", + "start": 136.66, + "end": 137.14, + "confidence": 0.999 + } + ] + }, + { + "id": 15, + "seek": 11312, + "start": 137.64, + "end": 140.16, + "text": " Look, okay I'm hoping that somebody pray for me", + "tokens": [ + 2053, + 11, + 1392, + 286, + 478, + 7159, + 300, + 2618, + 3690, + 337, + 385 + ], + "temperature": 0.0, + "avg_logprob": -0.2736021077857827, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.8637643456459045, + "confidence": 0.786, + "words": [ + { + "text": "Look,", + "start": 137.64, + "end": 138.46, + "confidence": 0.727 + }, + { + "text": "okay", + "start": 138.46, + "end": 138.62, + "confidence": 0.727 + }, + { + "text": "I'm", + "start": 138.62, + "end": 138.88, + "confidence": 0.698 + }, + { + "text": "hoping", + "start": 138.88, + "end": 139.14, + "confidence": 0.501 + }, + { + "text": "that", + "start": 139.14, + "end": 139.34, + "confidence": 0.958 + }, + { + "text": "somebody", + "start": 139.34, + "end": 139.52, + "confidence": 0.981 + }, + { + "text": "pray", + "start": 139.52, + "end": 139.8, + "confidence": 0.821 + }, + { + "text": "for", + "start": 139.8, + "end": 140.04, + "confidence": 0.9 + }, + { + "text": "me", + "start": 140.04, + "end": 140.16, 
+ "confidence": 0.999 + } + ] + }, + { + "id": 16, + "seek": 14012, + "start": 140.18, + "end": 141.7, + "text": " I'm praying that somebody hold for me.", + "tokens": [ + 286, + 478, + 15611, + 300, + 2618, + 1797, + 337, + 385, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.795, + "words": [ + { + "text": "I'm", + "start": 140.18, + "end": 140.38, + "confidence": 0.819 + }, + { + "text": "praying", + "start": 140.38, + "end": 140.62, + "confidence": 0.694 + }, + { + "text": "that", + "start": 140.62, + "end": 140.82, + "confidence": 0.786 + }, + { + "text": "somebody", + "start": 140.82, + "end": 141.08, + "confidence": 0.985 + }, + { + "text": "hold", + "start": 141.08, + "end": 141.32, + "confidence": 0.447 + }, + { + "text": "for", + "start": 141.32, + "end": 141.52, + "confidence": 0.993 + }, + { + "text": "me.", + "start": 141.52, + "end": 141.7, + "confidence": 0.999 + } + ] + }, + { + "id": 17, + "seek": 14012, + "start": 141.72, + "end": 143.43, + "text": " I'm staying where nobody's supposed to be.", + "tokens": [ + 286, + 478, + 7939, + 689, + 5079, + 311, + 3442, + 281, + 312, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.853, + "words": [ + { + "text": "I'm", + "start": 141.72, + "end": 141.9, + "confidence": 0.976 + }, + { + "text": "staying", + "start": 141.9, + "end": 142.12, + "confidence": 0.708 + }, + { + "text": "where", + "start": 142.12, + "end": 142.3, + "confidence": 0.906 + }, + { + "text": "nobody's", + "start": 142.3, + "end": 142.88, + "confidence": 0.654 + }, + { + "text": "supposed", + "start": 142.88, + "end": 142.92, + "confidence": 0.924 + }, + { + "text": "to", + "start": 142.92, + "end": 143.12, + "confidence": 0.992 + }, + { + "text": "be.", + "start": 143.12, + "end": 143.43, + 
"confidence": 0.997 + } + ] + }, + { + "id": 18, + "seek": 14012, + "start": 143.43, + "end": 145.29, + "text": " I propose to be in a wreck of emotions.", + "tokens": [ + 286, + 17421, + 281, + 312, + 294, + 257, + 21478, + 295, + 8462, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.645, + "words": [ + { + "text": "I", + "start": 143.43, + "end": 143.47, + "confidence": 0.492 + }, + { + "text": "propose", + "start": 143.47, + "end": 143.66, + "confidence": 0.332 + }, + { + "text": "to", + "start": 143.66, + "end": 143.84, + "confidence": 0.78 + }, + { + "text": "be", + "start": 143.84, + "end": 144.04, + "confidence": 0.442 + }, + { + "text": "in", + "start": 144.04, + "end": 144.16, + "confidence": 0.81 + }, + { + "text": "a", + "start": 144.16, + "end": 144.24, + "confidence": 0.555 + }, + { + "text": "wreck", + "start": 144.24, + "end": 144.36, + "confidence": 0.81 + }, + { + "text": "of", + "start": 144.36, + "end": 144.54, + "confidence": 0.99 + }, + { + "text": "emotions.", + "start": 144.54, + "end": 145.29, + "confidence": 0.953 + } + ] + }, + { + "id": 19, + "seek": 14012, + "start": 145.29, + "end": 146.56, + "text": " Ready to go whenever you let me know.", + "tokens": [ + 9944, + 281, + 352, + 5699, + 291, + 718, + 385, + 458, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.834, + "words": [ + { + "text": "Ready", + "start": 145.29, + "end": 145.33, + "confidence": 0.951 + }, + { + "text": "to", + "start": 145.33, + "end": 145.5, + "confidence": 0.997 + }, + { + "text": "go", + "start": 145.5, + "end": 145.56, + "confidence": 0.997 + }, + { + "text": "whenever", + "start": 145.56, + "end": 145.76, + "confidence": 0.659 + }, + { + "text": "you", + "start": 145.76, + "end": 145.92, + "confidence": 0.403 + }, + { 
+ "text": "let", + "start": 145.92, + "end": 146.04, + "confidence": 0.952 + }, + { + "text": "me", + "start": 146.04, + "end": 146.16, + "confidence": 0.998 + }, + { + "text": "know.", + "start": 146.16, + "end": 146.56, + "confidence": 0.977 + } + ] + }, + { + "id": 20, + "seek": 14012, + "start": 146.56, + "end": 147.86, + "text": " The road is long, so put the pedal into the flow.", + "tokens": [ + 440, + 3060, + 307, + 938, + 11, + 370, + 829, + 264, + 19122, + 666, + 264, + 3095, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.959, + "words": [ + { + "text": "The", + "start": 146.56, + "end": 146.6, + "confidence": 0.99 + }, + { + "text": "road", + "start": 146.6, + "end": 146.66, + "confidence": 0.99 + }, + { + "text": "is", + "start": 146.66, + "end": 146.74, + "confidence": 0.987 + }, + { + "text": "long,", + "start": 146.74, + "end": 146.96, + "confidence": 0.961 + }, + { + "text": "so", + "start": 146.96, + "end": 147.02, + "confidence": 0.968 + }, + { + "text": "put", + "start": 147.02, + "end": 147.14, + "confidence": 0.954 + }, + { + "text": "the", + "start": 147.14, + "end": 147.28, + "confidence": 0.972 + }, + { + "text": "pedal", + "start": 147.28, + "end": 147.38, + "confidence": 0.993 + }, + { + "text": "into", + "start": 147.38, + "end": 147.58, + "confidence": 0.898 + }, + { + "text": "the", + "start": 147.58, + "end": 147.74, + "confidence": 0.992 + }, + { + "text": "flow.", + "start": 147.74, + "end": 147.86, + "confidence": 0.857 + } + ] + }, + { + "id": 21, + "seek": 14012, + "start": 147.94, + "end": 150.22, + "text": " The enemy on my trail, my energy unavailable.", + "tokens": [ + 440, + 5945, + 322, + 452, + 9924, + 11, + 452, + 2281, + 36541, + 32699, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + 
"confidence": 0.949, + "words": [ + { + "text": "The", + "start": 147.94, + "end": 148.06, + "confidence": 0.968 + }, + { + "text": "enemy", + "start": 148.06, + "end": 148.24, + "confidence": 0.727 + }, + { + "text": "on", + "start": 148.24, + "end": 148.44, + "confidence": 0.974 + }, + { + "text": "my", + "start": 148.44, + "end": 148.5, + "confidence": 0.974 + }, + { + "text": "trail,", + "start": 148.5, + "end": 148.72, + "confidence": 0.986 + }, + { + "text": "my", + "start": 148.72, + "end": 148.82, + "confidence": 0.99 + }, + { + "text": "energy", + "start": 148.82, + "end": 149.06, + "confidence": 0.996 + }, + { + "text": "unavailable.", + "start": 149.06, + "end": 150.22, + "confidence": 0.978 + } + ] + }, + { + "id": 22, + "seek": 14012, + "start": 150.22, + "end": 151.35, + "text": " I'ma tell them I said away, go away.", + "tokens": [ + 286, + 478, + 64, + 980, + 552, + 286, + 848, + 1314, + 11, + 352, + 1314, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.571, + "words": [ + { + "text": "I'ma", + "start": 150.22, + "end": 150.26, + "confidence": 0.767 + }, + { + "text": "tell", + "start": 150.26, + "end": 150.36, + "confidence": 0.989 + }, + { + "text": "them", + "start": 150.36, + "end": 150.5, + "confidence": 0.336 + }, + { + "text": "I", + "start": 150.5, + "end": 150.58, + "confidence": 0.358 + }, + { + "text": "said", + "start": 150.58, + "end": 150.74, + "confidence": 0.3 + }, + { + "text": "away,", + "start": 150.74, + "end": 151.14, + "confidence": 0.323 + }, + { + "text": "go", + "start": 151.14, + "end": 151.18, + "confidence": 0.911 + }, + { + "text": "away.", + "start": 151.18, + "end": 151.35, + "confidence": 0.781 + } + ] + }, + { + "id": 23, + "seek": 14012, + "start": 151.35, + "end": 152.78, + "text": " When I'm plotting, I'ma drive to the top.", + "tokens": [ + 1133, + 286, + 478, + 41178, + 11, + 286, + 478, + 
64, + 3332, + 281, + 264, + 1192, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.645, + "words": [ + { + "text": "When", + "start": 151.35, + "end": 151.54, + "confidence": 0.884 + }, + { + "text": "I'm", + "start": 151.54, + "end": 151.72, + "confidence": 0.594 + }, + { + "text": "plotting,", + "start": 151.72, + "end": 151.92, + "confidence": 0.367 + }, + { + "text": "I'ma", + "start": 151.92, + "end": 152.04, + "confidence": 0.488 + }, + { + "text": "drive", + "start": 152.04, + "end": 152.14, + "confidence": 0.621 + }, + { + "text": "to", + "start": 152.14, + "end": 152.32, + "confidence": 0.984 + }, + { + "text": "the", + "start": 152.32, + "end": 152.38, + "confidence": 0.997 + }, + { + "text": "top.", + "start": 152.38, + "end": 152.78, + "confidence": 0.999 + } + ] + }, + { + "id": 24, + "seek": 14012, + "start": 152.78, + "end": 153.76, + "text": " I've been out of shape, thinking out of the box.", + "tokens": [ + 286, + 600, + 668, + 484, + 295, + 3909, + 11, + 1953, + 484, + 295, + 264, + 2424, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.769, + "words": [ + { + "text": "I've", + "start": 152.78, + "end": 152.82, + "confidence": 0.721 + }, + { + "text": "been", + "start": 152.82, + "end": 152.86, + "confidence": 0.998 + }, + { + "text": "out", + "start": 152.86, + "end": 152.9, + "confidence": 0.905 + }, + { + "text": "of", + "start": 152.9, + "end": 152.96, + "confidence": 0.986 + }, + { + "text": "shape,", + "start": 152.96, + "end": 153.12, + "confidence": 0.998 + }, + { + "text": "thinking", + "start": 153.12, + "end": 153.3, + "confidence": 0.842 + }, + { + "text": "out", + "start": 153.3, + "end": 153.48, + "confidence": 0.347 + }, + { + "text": "of", + "start": 153.48, + "end": 153.54, + "confidence": 
0.507 + }, + { + "text": "the", + "start": 153.54, + "end": 153.58, + "confidence": 0.819 + }, + { + "text": "box.", + "start": 153.58, + "end": 153.76, + "confidence": 0.998 + } + ] + }, + { + "id": 25, + "seek": 14012, + "start": 153.76, + "end": 155.34, + "text": " I'm an astronaut, blasted off the planet.", + "tokens": [ + 286, + 478, + 364, + 18516, + 11, + 12035, + 292, + 766, + 264, + 5054, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.967, + "words": [ + { + "text": "I'm", + "start": 153.76, + "end": 153.9, + "confidence": 0.996 + }, + { + "text": "an", + "start": 153.9, + "end": 153.98, + "confidence": 0.996 + }, + { + "text": "astronaut,", + "start": 153.98, + "end": 154.68, + "confidence": 0.991 + }, + { + "text": "blasted", + "start": 154.68, + "end": 154.86, + "confidence": 0.895 + }, + { + "text": "off", + "start": 154.86, + "end": 155.0, + "confidence": 0.987 + }, + { + "text": "the", + "start": 155.0, + "end": 155.16, + "confidence": 0.959 + }, + { + "text": "planet.", + "start": 155.16, + "end": 155.34, + "confidence": 0.997 + } + ] + }, + { + "id": 26, + "seek": 14012, + "start": 155.36, + "end": 157.11, + "text": " Rock the cars, catastrophic, and it matters more", + "tokens": [ + 6922, + 264, + 5163, + 11, + 34915, + 11, + 293, + 309, + 7001, + 544 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.703, + "words": [ + { + "text": "Rock", + "start": 155.36, + "end": 155.56, + "confidence": 0.563 + }, + { + "text": "the", + "start": 155.56, + "end": 155.7, + "confidence": 0.504 + }, + { + "text": "cars,", + "start": 155.7, + "end": 156.36, + "confidence": 0.472 + }, + { + "text": "catastrophic,", + "start": 156.36, + "end": 156.4, + "confidence": 0.77 + }, + { + "text": "and", + "start": 156.4, + "end": 156.62, 
+ "confidence": 0.925 + }, + { + "text": "it", + "start": 156.62, + "end": 156.7, + "confidence": 0.73 + }, + { + "text": "matters", + "start": 156.7, + "end": 156.94, + "confidence": 0.874 + }, + { + "text": "more", + "start": 156.94, + "end": 157.11, + "confidence": 0.973 + } + ] + }, + { + "id": 27, + "seek": 14012, + "start": 157.11, + "end": 157.93, + "text": " because I had it now.", + "tokens": [ + 570, + 286, + 632, + 309, + 586, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.648, + "words": [ + { + "text": "because", + "start": 157.11, + "end": 157.38, + "confidence": 0.99 + }, + { + "text": "I", + "start": 157.38, + "end": 157.56, + "confidence": 0.528 + }, + { + "text": "had", + "start": 157.56, + "end": 157.68, + "confidence": 0.935 + }, + { + "text": "it", + "start": 157.68, + "end": 157.76, + "confidence": 0.984 + }, + { + "text": "now.", + "start": 157.76, + "end": 157.93, + "confidence": 0.237 + } + ] + }, + { + "id": 28, + "seek": 14012, + "start": 157.93, + "end": 160.1, + "text": " Had I thought about wreaking havoc on an opposition.", + "tokens": [ + 12298, + 286, + 1194, + 466, + 46674, + 2456, + 47367, + 322, + 364, + 13504, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.955, + "words": [ + { + "text": "Had", + "start": 157.93, + "end": 158.12, + "confidence": 0.852 + }, + { + "text": "I", + "start": 158.12, + "end": 158.2, + "confidence": 0.971 + }, + { + "text": "thought", + "start": 158.2, + "end": 158.4, + "confidence": 0.991 + }, + { + "text": "about", + "start": 158.4, + "end": 158.58, + "confidence": 0.995 + }, + { + "text": "wreaking", + "start": 158.58, + "end": 158.84, + "confidence": 0.996 + }, + { + "text": "havoc", + "start": 158.84, + "end": 159.08, + "confidence": 1.0 + }, + { + 
"text": "on", + "start": 159.08, + "end": 159.28, + "confidence": 0.861 + }, + { + "text": "an", + "start": 159.28, + "end": 159.44, + "confidence": 0.913 + }, + { + "text": "opposition.", + "start": 159.44, + "end": 160.1, + "confidence": 0.991 + } + ] + }, + { + "id": 29, + "seek": 14012, + "start": 160.1, + "end": 161.04, + "text": " Kind of shocking, they want it static.", + "tokens": [ + 9242, + 295, + 18776, + 11, + 436, + 528, + 309, + 13437, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.666, + "words": [ + { + "text": "Kind", + "start": 160.1, + "end": 160.14, + "confidence": 0.663 + }, + { + "text": "of", + "start": 160.14, + "end": 160.22, + "confidence": 0.995 + }, + { + "text": "shocking,", + "start": 160.22, + "end": 160.5, + "confidence": 0.656 + }, + { + "text": "they", + "start": 160.5, + "end": 160.58, + "confidence": 0.366 + }, + { + "text": "want", + "start": 160.58, + "end": 160.74, + "confidence": 0.573 + }, + { + "text": "it", + "start": 160.74, + "end": 160.84, + "confidence": 0.648 + }, + { + "text": "static.", + "start": 160.84, + "end": 161.04, + "confidence": 0.993 + } + ] + }, + { + "id": 30, + "seek": 14012, + "start": 161.06, + "end": 162.14, + "text": " With precision, I'm automatic.", + "tokens": [ + 2022, + 18356, + 11, + 286, + 478, + 12509, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.875, + "words": [ + { + "text": "With", + "start": 161.06, + "end": 161.24, + "confidence": 0.59 + }, + { + "text": "precision,", + "start": 161.24, + "end": 161.72, + "confidence": 0.904 + }, + { + "text": "I'm", + "start": 161.72, + "end": 161.78, + "confidence": 0.987 + }, + { + "text": "automatic.", + "start": 161.78, + "end": 162.14, + "confidence": 0.987 + } + ] + }, + { + "id": 31, + "seek": 
14012, + "start": 162.24, + "end": 163.36, + "text": " Quarterback, I ain't talking second.", + "tokens": [ + 43794, + 3207, + 11, + 286, + 7862, + 380, + 1417, + 1150, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.688, + "words": [ + { + "text": "Quarterback,", + "start": 162.24, + "end": 162.66, + "confidence": 0.513 + }, + { + "text": "I", + "start": 162.66, + "end": 162.78, + "confidence": 0.965 + }, + { + "text": "ain't", + "start": 162.78, + "end": 162.86, + "confidence": 0.99 + }, + { + "text": "talking", + "start": 162.86, + "end": 163.1, + "confidence": 0.892 + }, + { + "text": "second.", + "start": 163.1, + "end": 163.36, + "confidence": 0.328 + } + ] + }, + { + "id": 32, + "seek": 14012, + "start": 163.4, + "end": 164.17, + "text": " Pack it, pack it up.", + "tokens": [ + 18466, + 309, + 11, + 2844, + 309, + 493, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.973, + "words": [ + { + "text": "Pack", + "start": 163.4, + "end": 163.6, + "confidence": 0.968 + }, + { + "text": "it,", + "start": 163.6, + "end": 163.68, + "confidence": 0.937 + }, + { + "text": "pack", + "start": 163.68, + "end": 163.84, + "confidence": 0.986 + }, + { + "text": "it", + "start": 163.84, + "end": 163.98, + "confidence": 0.999 + }, + { + "text": "up.", + "start": 163.98, + "end": 164.17, + "confidence": 0.979 + } + ] + }, + { + "id": 33, + "seek": 14012, + "start": 164.17, + "end": 165.1, + "text": " I don't panic, better, better.", + "tokens": [ + 286, + 500, + 380, + 14783, + 11, + 1101, + 11, + 1101, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.76, + "words": [ + { + "text": "I", + "start": 164.17, + "end": 
164.21, + "confidence": 0.984 + }, + { + "text": "don't", + "start": 164.21, + "end": 164.34, + "confidence": 0.913 + }, + { + "text": "panic,", + "start": 164.34, + "end": 164.8, + "confidence": 0.999 + }, + { + "text": "better,", + "start": 164.8, + "end": 164.84, + "confidence": 0.423 + }, + { + "text": "better.", + "start": 164.84, + "end": 165.1, + "confidence": 0.556 + } + ] + }, + { + "id": 34, + "seek": 14012, + "start": 165.16, + "end": 165.76, + "text": " Up who the baddest.", + "tokens": [ + 5858, + 567, + 264, + 1578, + 23748, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3642334662543403, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7768110036849976, + "confidence": 0.752, + "words": [ + { + "text": "Up", + "start": 165.16, + "end": 165.24, + "confidence": 0.518 + }, + { + "text": "who", + "start": 165.24, + "end": 165.38, + "confidence": 0.751 + }, + { + "text": "the", + "start": 165.38, + "end": 165.52, + "confidence": 0.926 + }, + { + "text": "baddest.", + "start": 165.52, + "end": 165.76, + "confidence": 0.817 + } + ] + }, + { + "id": 35, + "seek": 16572, + "start": 165.76, + "end": 166.86, + "text": " it don't matter cause we is your enemy.", + "tokens": [ + 50364, + 309, + 500, + 380, + 1871, + 3082, + 321, + 307, + 428, + 5945, + 13, + 50414 + ], + "temperature": 0.0, + "avg_logprob": -0.910880969120906, + "compression_ratio": 0.8297872340425532, + "no_speech_prob": 0.6945543885231018, + "confidence": 0.448, + "words": [ + { + "text": "it", + "start": 165.76, + "end": 165.86, + "confidence": 0.124 + }, + { + "text": "don't", + "start": 165.86, + "end": 166.18, + "confidence": 0.825 + }, + { + "text": "matter", + "start": 166.18, + "end": 166.22, + "confidence": 0.996 + }, + { + "text": "cause", + "start": 166.22, + "end": 166.4, + "confidence": 0.287 + }, + { + "text": "we", + "start": 166.4, + "end": 166.5, + "confidence": 0.889 + }, + { + "text": "is", + "start": 166.5, + "end": 166.68, + "confidence": 0.231 + }, + { 
+ "text": "your", + "start": 166.68, + "end": 166.74, + "confidence": 0.562 + }, + { + "text": "enemy.", + "start": 166.74, + "end": 166.86, + "confidence": 0.258 + } + ] + }, + { + "id": 36, + "seek": 19572, + "start": 196.18, + "end": 198.2, + "text": " I swear I'll never be insane", + "tokens": [ + 286, + 11902, + 286, + 603, + 1128, + 312, + 10838 + ], + "temperature": 0.0, + "avg_logprob": -0.5786522030830383, + "compression_ratio": 1.0, + "no_speech_prob": 0.756009578704834, + "confidence": 0.75, + "words": [ + { + "text": "I", + "start": 196.18, + "end": 196.4, + "confidence": 0.623 + }, + { + "text": "swear", + "start": 196.4, + "end": 196.66, + "confidence": 0.959 + }, + { + "text": "I'll", + "start": 196.66, + "end": 197.2, + "confidence": 0.643 + }, + { + "text": "never", + "start": 197.2, + "end": 197.5, + "confidence": 0.997 + }, + { + "text": "be", + "start": 197.5, + "end": 197.84, + "confidence": 0.993 + }, + { + "text": "insane", + "start": 197.84, + "end": 198.2, + "confidence": 0.546 + } + ] + }, + { + "id": 37, + "seek": 19772, + "start": 198.38, + "end": 199.72, + "text": " You got to be yourself", + "tokens": [ + 50364, + 509, + 658, + 281, + 312, + 1803, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.7925397753715515, + "compression_ratio": 0.7333333333333333, + "no_speech_prob": 0.7818466424942017, + "confidence": 0.406, + "words": [ + { + "text": "You", + "start": 198.38, + "end": 198.54, + "confidence": 0.093 + }, + { + "text": "got", + "start": 198.54, + "end": 198.8, + "confidence": 0.199 + }, + { + "text": "to", + "start": 198.8, + "end": 198.98, + "confidence": 0.803 + }, + { + "text": "be", + "start": 198.98, + "end": 199.08, + "confidence": 0.826 + }, + { + "text": "yourself", + "start": 199.08, + "end": 199.72, + "confidence": 0.903 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases.cpu/random.nocond_apollo11.mp3.words.json 
b/tests/expected/corner_cases.cpu/random.nocond_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..411722411d7434ca27a340d8cf4629331e376df9 --- /dev/null +++ b/tests/expected/corner_cases.cpu/random.nocond_apollo11.mp3.words.json @@ -0,0 +1,1192 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA. All right. Okay, we like to say that they make it one or two on the helmet. We're going to have a B1 and you can put the other one on the mic helmet with those GVA blizzard frames. We were going to hack me on the ground with a cover. I tried it already. Okay, fine. We weren't sure of that. Just a suggestion. We thought we'd get you to check it out. I'm not sure if you've already turned that. So I guess we're going to come up with this. Let us know. Okay, no problem. Okay, no problem. No problem. No one at the end of the line.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.64, + "end": 6.68, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 20914, + 460, + 2634, + 15454, + 460, + 20914, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.709779328937772, + "compression_ratio": 1.3631578947368421, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.542, + "words": [ + { + "text": "Apollo", + "start": 0.64, + "end": 0.98, + "confidence": 0.155 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.54, + "confidence": 0.977 + }, + { + "text": "Houston", + "start": 1.54, + "end": 1.8, + "confidence": 0.986 + }, + { + "text": "we", + "start": 1.8, + "end": 1.98, + "confidence": 0.52 + }, + { + "text": "got", + "start": 1.98, + "end": 2.16, + "confidence": 0.824 + }, + { + "text": "a", + "start": 2.16, + "end": 2.38, + "confidence": 0.989 + }, + { + "text": "recommendation", + "start": 2.38, + "end": 3.1, + 
"confidence": 0.968 + }, + { + "text": "for", + "start": 3.1, + "end": 3.52, + "confidence": 0.947 + }, + { + "text": "you", + "start": 3.52, + "end": 3.9, + "confidence": 0.984 + }, + { + "text": "on", + "start": 3.9, + "end": 4.28, + "confidence": 0.909 + }, + { + "text": "your", + "start": 4.28, + "end": 4.32, + "confidence": 0.971 + }, + { + "text": "Soyuz-VA", + "start": 4.32, + "end": 5.38, + "confidence": 0.26 + }, + { + "text": "GLEME", + "start": 5.38, + "end": 6.04, + "confidence": 0.478 + }, + { + "text": "GVA.", + "start": 6.04, + "end": 6.68, + "confidence": 0.436 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 7.5, + "end": 11.0, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.709779328937772, + "compression_ratio": 1.3631578947368421, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.456, + "words": [ + { + "text": "All", + "start": 7.5, + "end": 7.7, + "confidence": 0.212 + }, + { + "text": "right.", + "start": 7.7, + "end": 11.0, + "confidence": 0.982 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 11.5, + "end": 17.19, + "text": " Okay, we like to say that they make it one or two on the helmet.", + "tokens": [ + 1033, + 11, + 321, + 411, + 281, + 584, + 300, + 436, + 652, + 309, + 472, + 420, + 732, + 322, + 264, + 15922, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.709779328937772, + "compression_ratio": 1.3631578947368421, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.428, + "words": [ + { + "text": "Okay,", + "start": 11.5, + "end": 12.82, + "confidence": 0.577 + }, + { + "text": "we", + "start": 12.82, + "end": 13.12, + "confidence": 0.541 + }, + { + "text": "like", + "start": 13.12, + "end": 13.44, + "confidence": 0.493 + }, + { + "text": "to", + "start": 13.44, + "end": 13.68, + "confidence": 0.307 + }, + { + "text": "say", + "start": 13.68, + "end": 14.96, + "confidence": 0.172 + }, + { + "text": "that", + "start": 14.96, + "end": 15.56, + 
"confidence": 0.203 + }, + { + "text": "they", + "start": 15.56, + "end": 15.6, + "confidence": 0.472 + }, + { + "text": "make", + "start": 15.6, + "end": 15.76, + "confidence": 0.378 + }, + { + "text": "it", + "start": 15.76, + "end": 15.96, + "confidence": 0.259 + }, + { + "text": "one", + "start": 15.96, + "end": 16.1, + "confidence": 0.481 + }, + { + "text": "or", + "start": 16.1, + "end": 16.34, + "confidence": 0.221 + }, + { + "text": "two", + "start": 16.34, + "end": 16.46, + "confidence": 0.938 + }, + { + "text": "on", + "start": 16.46, + "end": 16.7, + "confidence": 0.638 + }, + { + "text": "the", + "start": 16.7, + "end": 16.96, + "confidence": 0.885 + }, + { + "text": "helmet.", + "start": 16.96, + "end": 17.19, + "confidence": 0.695 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 17.19, + "end": 24.74, + "text": " We're going to have a B1 and you can put the other one on the mic helmet with those GVA blizzard frames.", + "tokens": [ + 492, + 434, + 516, + 281, + 362, + 257, + 363, + 16, + 293, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 888, + 31062, + 12083, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.709779328937772, + "compression_ratio": 1.3631578947368421, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.515, + "words": [ + { + "text": "We're", + "start": 17.19, + "end": 17.86, + "confidence": 0.63 + }, + { + "text": "going", + "start": 17.86, + "end": 18.06, + "confidence": 0.62 + }, + { + "text": "to", + "start": 18.06, + "end": 18.24, + "confidence": 0.993 + }, + { + "text": "have", + "start": 18.24, + "end": 18.3, + "confidence": 0.959 + }, + { + "text": "a", + "start": 18.3, + "end": 18.42, + "confidence": 0.32 + }, + { + "text": "B1", + "start": 18.42, + "end": 19.3, + "confidence": 0.799 + }, + { + "text": "and", + "start": 19.3, + "end": 20.18, + "confidence": 0.498 + }, + { + "text": "you", + "start": 20.18, + "end": 20.36, + "confidence": 0.87 + }, + { + 
"text": "can", + "start": 20.36, + "end": 20.54, + "confidence": 0.672 + }, + { + "text": "put", + "start": 20.54, + "end": 20.72, + "confidence": 0.967 + }, + { + "text": "the", + "start": 20.72, + "end": 20.88, + "confidence": 0.974 + }, + { + "text": "other", + "start": 20.88, + "end": 21.06, + "confidence": 0.995 + }, + { + "text": "one", + "start": 21.06, + "end": 21.26, + "confidence": 0.973 + }, + { + "text": "on", + "start": 21.26, + "end": 21.68, + "confidence": 0.973 + }, + { + "text": "the", + "start": 21.68, + "end": 21.96, + "confidence": 0.585 + }, + { + "text": "mic", + "start": 21.96, + "end": 22.6, + "confidence": 0.48 + }, + { + "text": "helmet", + "start": 22.6, + "end": 22.94, + "confidence": 0.949 + }, + { + "text": "with", + "start": 22.94, + "end": 23.2, + "confidence": 0.444 + }, + { + "text": "those", + "start": 23.2, + "end": 23.5, + "confidence": 0.351 + }, + { + "text": "GVA", + "start": 23.5, + "end": 23.86, + "confidence": 0.169 + }, + { + "text": "blizzard", + "start": 23.86, + "end": 24.32, + "confidence": 0.094 + }, + { + "text": "frames.", + "start": 24.32, + "end": 24.74, + "confidence": 0.245 + } + ] + }, + { + "id": 4, + "seek": 5500, + "start": 56.0, + "end": 61.1, + "text": " We were going to hack me on the ground with a cover.", + "tokens": [ + 492, + 645, + 516, + 281, + 10339, + 385, + 322, + 264, + 2727, + 365, + 257, + 2060, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.342, + "words": [ + { + "text": "We", + "start": 56.0, + "end": 56.68, + "confidence": 0.071 + }, + { + "text": "were", + "start": 56.68, + "end": 56.98, + "confidence": 0.177 + }, + { + "text": "going", + "start": 56.98, + "end": 57.2, + "confidence": 0.148 + }, + { + "text": "to", + "start": 57.2, + "end": 57.46, + "confidence": 0.932 + }, + { + "text": "hack", + "start": 57.46, + "end": 57.5, + "confidence": 0.261 + }, + { + 
"text": "me", + "start": 57.5, + "end": 57.64, + "confidence": 0.544 + }, + { + "text": "on", + "start": 57.64, + "end": 59.2, + "confidence": 0.433 + }, + { + "text": "the", + "start": 59.2, + "end": 59.5, + "confidence": 0.309 + }, + { + "text": "ground", + "start": 59.5, + "end": 59.78, + "confidence": 0.356 + }, + { + "text": "with", + "start": 59.78, + "end": 60.62, + "confidence": 0.471 + }, + { + "text": "a", + "start": 60.62, + "end": 60.78, + "confidence": 0.538 + }, + { + "text": "cover.", + "start": 60.78, + "end": 61.1, + "confidence": 0.855 + } + ] + }, + { + "id": 5, + "seek": 5500, + "start": 61.12, + "end": 61.88, + "text": " I tried it already.", + "tokens": [ + 286, + 3031, + 309, + 1217, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.682, + "words": [ + { + "text": "I", + "start": 61.12, + "end": 61.26, + "confidence": 0.407 + }, + { + "text": "tried", + "start": 61.26, + "end": 61.52, + "confidence": 0.889 + }, + { + "text": "it", + "start": 61.52, + "end": 61.7, + "confidence": 0.746 + }, + { + "text": "already.", + "start": 61.7, + "end": 61.88, + "confidence": 0.803 + } + ] + }, + { + "id": 6, + "seek": 5500, + "start": 62.5, + "end": 63.12, + "text": " Okay, fine.", + "tokens": [ + 1033, + 11, + 2489, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.683, + "words": [ + { + "text": "Okay,", + "start": 62.5, + "end": 63.04, + "confidence": 0.521 + }, + { + "text": "fine.", + "start": 63.04, + "end": 63.12, + "confidence": 0.895 + } + ] + }, + { + "id": 7, + "seek": 5500, + "start": 63.12, + "end": 64.12, + "text": " We weren't sure of that.", + "tokens": [ + 492, + 4999, + 380, + 988, + 295, + 300, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 
1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.895, + "words": [ + { + "text": "We", + "start": 63.12, + "end": 63.34, + "confidence": 0.959 + }, + { + "text": "weren't", + "start": 63.34, + "end": 63.62, + "confidence": 0.988 + }, + { + "text": "sure", + "start": 63.62, + "end": 63.82, + "confidence": 0.903 + }, + { + "text": "of", + "start": 63.82, + "end": 64.08, + "confidence": 0.613 + }, + { + "text": "that.", + "start": 64.08, + "end": 64.12, + "confidence": 0.989 + } + ] + }, + { + "id": 8, + "seek": 5500, + "start": 64.46, + "end": 65.2, + "text": " Just a suggestion.", + "tokens": [ + 1449, + 257, + 16541, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.755, + "words": [ + { + "text": "Just", + "start": 64.46, + "end": 64.66, + "confidence": 0.545 + }, + { + "text": "a", + "start": 64.66, + "end": 64.76, + "confidence": 0.791 + }, + { + "text": "suggestion.", + "start": 64.76, + "end": 65.2, + "confidence": 0.997 + } + ] + }, + { + "id": 9, + "seek": 5500, + "start": 65.34, + "end": 67.92, + "text": " We thought we'd get you to check it out.", + "tokens": [ + 492, + 1194, + 321, + 1116, + 483, + 291, + 281, + 1520, + 309, + 484, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.692, + "words": [ + { + "text": "We", + "start": 65.34, + "end": 65.44, + "confidence": 0.873 + }, + { + "text": "thought", + "start": 65.44, + "end": 65.62, + "confidence": 0.968 + }, + { + "text": "we'd", + "start": 65.62, + "end": 66.76, + "confidence": 0.686 + }, + { + "text": "get", + "start": 66.76, + "end": 67.06, + "confidence": 0.093 + }, + { + "text": "you", + "start": 67.06, + "end": 67.14, + "confidence": 0.823 + }, + { + "text": "to", + "start": 67.14, + "end": 67.32, + "confidence": 0.987 + }, + { 
+ "text": "check", + "start": 67.32, + "end": 67.46, + "confidence": 0.845 + }, + { + "text": "it", + "start": 67.46, + "end": 67.68, + "confidence": 0.991 + }, + { + "text": "out.", + "start": 67.68, + "end": 67.92, + "confidence": 0.997 + } + ] + }, + { + "id": 10, + "seek": 5500, + "start": 68.28, + "end": 69.34, + "text": " I'm not sure if you've already turned that.", + "tokens": [ + 286, + 478, + 406, + 988, + 498, + 291, + 600, + 1217, + 3574, + 300, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.444, + "words": [ + { + "text": "I'm", + "start": 68.28, + "end": 68.5, + "confidence": 0.314 + }, + { + "text": "not", + "start": 68.5, + "end": 68.56, + "confidence": 0.319 + }, + { + "text": "sure", + "start": 68.56, + "end": 68.74, + "confidence": 0.82 + }, + { + "text": "if", + "start": 68.74, + "end": 68.78, + "confidence": 0.334 + }, + { + "text": "you've", + "start": 68.78, + "end": 68.84, + "confidence": 0.389 + }, + { + "text": "already", + "start": 68.84, + "end": 68.94, + "confidence": 0.588 + }, + { + "text": "turned", + "start": 68.94, + "end": 69.12, + "confidence": 0.738 + }, + { + "text": "that.", + "start": 69.12, + "end": 69.34, + "confidence": 0.524 + } + ] + }, + { + "id": 11, + "seek": 5500, + "start": 70.42, + "end": 71.98, + "text": " So I guess we're going to come up with this.", + "tokens": [ + 407, + 286, + 2041, + 321, + 434, + 516, + 281, + 808, + 493, + 365, + 341, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.709, + "words": [ + { + "text": "So", + "start": 70.42, + "end": 70.5, + "confidence": 0.533 + }, + { + "text": "I", + "start": 70.5, + "end": 70.54, + "confidence": 0.454 + }, + { + "text": "guess", + "start": 70.54, + "end": 70.82, + "confidence": 0.991 + }, + { + "text": "we're", + 
"start": 70.82, + "end": 71.12, + "confidence": 0.654 + }, + { + "text": "going", + "start": 71.12, + "end": 71.28, + "confidence": 0.815 + }, + { + "text": "to", + "start": 71.28, + "end": 71.36, + "confidence": 0.992 + }, + { + "text": "come", + "start": 71.36, + "end": 71.48, + "confidence": 0.97 + }, + { + "text": "up", + "start": 71.48, + "end": 71.68, + "confidence": 0.958 + }, + { + "text": "with", + "start": 71.68, + "end": 71.92, + "confidence": 0.915 + }, + { + "text": "this.", + "start": 71.92, + "end": 71.98, + "confidence": 0.323 + } + ] + }, + { + "id": 12, + "seek": 5500, + "start": 73.5, + "end": 73.62, + "text": " Let us know.", + "tokens": [ + 961, + 505, + 458, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.847, + "words": [ + { + "text": "Let", + "start": 73.5, + "end": 73.54, + "confidence": 0.615 + }, + { + "text": "us", + "start": 73.54, + "end": 73.58, + "confidence": 0.99 + }, + { + "text": "know.", + "start": 73.58, + "end": 73.62, + "confidence": 0.998 + } + ] + }, + { + "id": 13, + "seek": 5500, + "start": 74.22, + "end": 75.22, + "text": " Okay, no problem.", + "tokens": [ + 1033, + 11, + 572, + 1154, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 0.7498895525932312, + "confidence": 0.851, + "words": [ + { + "text": "Okay,", + "start": 74.22, + "end": 74.7, + "confidence": 0.687 + }, + { + "text": "no", + "start": 74.7, + "end": 74.86, + "confidence": 0.917 + }, + { + "text": "problem.", + "start": 74.86, + "end": 75.22, + "confidence": 0.976 + } + ] + }, + { + "id": 14, + "seek": 5500, + "start": 75.28, + "end": 76.46, + "text": " Okay, no problem.", + "tokens": [ + 1033, + 11, + 572, + 1154, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.46802620968576203, + "compression_ratio": 1.6418604651162791, + "no_speech_prob": 
0.7498895525932312, + "confidence": 0.623, + "words": [ + { + "text": "Okay,", + "start": 75.28, + "end": 75.98, + "confidence": 0.258 + }, + { + "text": "no", + "start": 75.98, + "end": 76.2, + "confidence": 0.948 + }, + { + "text": "problem.", + "start": 76.2, + "end": 76.46, + "confidence": 0.993 + } + ] + }, + { + "id": 15, + "seek": 7600, + "start": 76.46, + "end": 76.62, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.1, + "avg_logprob": -0.7044810771942138, + "compression_ratio": 0.9344262295081968, + "no_speech_prob": 0.35927486419677734, + "confidence": 0.653, + "words": [ + { + "text": "No", + "start": 76.46, + "end": 76.5, + "confidence": 0.463 + }, + { + "text": "problem.", + "start": 76.5, + "end": 76.62, + "confidence": 0.922 + } + ] + }, + { + "id": 16, + "seek": 7700, + "start": 77.02, + "end": 78.32, + "text": " No one at the end of the line.", + "tokens": [ + 50364, + 883, + 472, + 412, + 264, + 917, + 295, + 264, + 1622, + 13, + 50464 + ], + "temperature": 0.1, + "avg_logprob": -0.676593542098999, + "compression_ratio": 0.8823529411764706, + "no_speech_prob": 0.2589211165904999, + "confidence": 0.558, + "words": [ + { + "text": "No", + "start": 77.02, + "end": 77.22, + "confidence": 0.139 + }, + { + "text": "one", + "start": 77.22, + "end": 77.36, + "confidence": 0.335 + }, + { + "text": "at", + "start": 77.36, + "end": 77.44, + "confidence": 0.483 + }, + { + "text": "the", + "start": 77.44, + "end": 77.48, + "confidence": 0.996 + }, + { + "text": "end", + "start": 77.48, + "end": 77.92, + "confidence": 0.995 + }, + { + "text": "of", + "start": 77.92, + "end": 78.1, + "confidence": 0.968 + }, + { + "text": "the", + "start": 78.1, + "end": 78.2, + "confidence": 0.536 + }, + { + "text": "line.", + "start": 78.2, + "end": 78.32, + "confidence": 0.816 + } + ] + } + ], + "language": "English" +} \ No newline at end of file diff --git a/tests/expected/corner_cases.cpu/random_apollo11.mp3.words.json 
b/tests/expected/corner_cases.cpu/random_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..23ccd701318a10a1d5462a5b3b9a55f8ce872217 --- /dev/null +++ b/tests/expected/corner_cases.cpu/random_apollo11.mp3.words.json @@ -0,0 +1,3815 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-EA GLEME GVA. Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1. And you can put the other one on the mic helmet with those GVA blizzard frames. Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, 
got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.64, + "end": 6.94, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-EA GLEME GVA.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 36, + 32, + 460, + 2634, + 15454, + 460, + 20914, + 13 + ], + "temperature": 0.2, + "avg_logprob": -0.6937426777629109, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.549, + "words": [ + { + "text": "Apollo", + "start": 0.64, + "end": 0.98, + "confidence": 0.155 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.54, + "confidence": 0.977 + }, + { + "text": "Houston", + "start": 1.54, + "end": 1.8, + "confidence": 0.986 + }, + { + "text": "we", + "start": 1.8, + "end": 1.98, + "confidence": 0.52 + }, + { + "text": "got", + "start": 1.98, + "end": 2.16, + "confidence": 0.824 + }, + { + "text": "a", + "start": 2.16, + "end": 2.38, + "confidence": 0.989 + }, + { + "text": "recommendation", + "start": 2.38, + "end": 3.1, + "confidence": 0.968 + }, + { + "text": "for", + "start": 3.1, + "end": 3.52, + "confidence": 0.947 + }, + { + "text": "you", + "start": 
3.52, + "end": 3.9, + "confidence": 0.984 + }, + { + "text": "on", + "start": 3.9, + "end": 4.28, + "confidence": 0.909 + }, + { + "text": "your", + "start": 4.28, + "end": 4.32, + "confidence": 0.971 + }, + { + "text": "Soyuz-EA", + "start": 4.32, + "end": 5.42, + "confidence": 0.321 + }, + { + "text": "GLEME", + "start": 5.42, + "end": 6.04, + "confidence": 0.561 + }, + { + "text": "GVA.", + "start": 6.04, + "end": 6.94, + "confidence": 0.336 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.82, + "end": 19.86, + "text": " Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1.", + "tokens": [ + 2798, + 11, + 1392, + 11, + 321, + 411, + 281, + 584, + 300, + 436, + 652, + 264, + 472, + 300, + 311, + 322, + 264, + 15922, + 321, + 434, + 516, + 281, + 362, + 294, + 363, + 16, + 13 + ], + "temperature": 0.2, + "avg_logprob": -0.6937426777629109, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.469, + "words": [ + { + "text": "Alright,", + "start": 10.82, + "end": 12.5, + "confidence": 0.295 + }, + { + "text": "okay,", + "start": 12.5, + "end": 12.94, + "confidence": 0.513 + }, + { + "text": "we", + "start": 12.94, + "end": 13.12, + "confidence": 0.614 + }, + { + "text": "like", + "start": 13.12, + "end": 13.44, + "confidence": 0.496 + }, + { + "text": "to", + "start": 13.44, + "end": 13.68, + "confidence": 0.26 + }, + { + "text": "say", + "start": 13.68, + "end": 14.98, + "confidence": 0.135 + }, + { + "text": "that", + "start": 14.98, + "end": 15.56, + "confidence": 0.203 + }, + { + "text": "they", + "start": 15.56, + "end": 15.6, + "confidence": 0.425 + }, + { + "text": "make", + "start": 15.6, + "end": 15.76, + "confidence": 0.408 + }, + { + "text": "the", + "start": 15.76, + "end": 15.92, + "confidence": 0.255 + }, + { + "text": "one", + "start": 15.92, + "end": 16.1, + "confidence": 0.609 + }, + { + "text": "that's", + "start": 16.1, + "end": 16.34, + 
"confidence": 0.447 + }, + { + "text": "on", + "start": 16.34, + "end": 16.62, + "confidence": 0.598 + }, + { + "text": "the", + "start": 16.62, + "end": 16.96, + "confidence": 0.837 + }, + { + "text": "helmet", + "start": 16.96, + "end": 17.36, + "confidence": 0.836 + }, + { + "text": "we're", + "start": 17.36, + "end": 17.86, + "confidence": 0.301 + }, + { + "text": "going", + "start": 17.86, + "end": 18.06, + "confidence": 0.606 + }, + { + "text": "to", + "start": 18.06, + "end": 18.22, + "confidence": 0.818 + }, + { + "text": "have", + "start": 18.22, + "end": 18.26, + "confidence": 0.846 + }, + { + "text": "in", + "start": 18.26, + "end": 18.42, + "confidence": 0.718 + }, + { + "text": "B1.", + "start": 18.42, + "end": 19.86, + "confidence": 0.798 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 20.1, + "end": 24.76, + "text": " And you can put the other one on the mic helmet with those GVA blizzard frames.", + "tokens": [ + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 888, + 31062, + 12083, + 13 + ], + "temperature": 0.2, + "avg_logprob": -0.6937426777629109, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.52, + "words": [ + { + "text": "And", + "start": 20.1, + "end": 20.26, + "confidence": 0.62 + }, + { + "text": "you", + "start": 20.26, + "end": 20.38, + "confidence": 0.948 + }, + { + "text": "can", + "start": 20.38, + "end": 20.54, + "confidence": 0.731 + }, + { + "text": "put", + "start": 20.54, + "end": 20.72, + "confidence": 0.98 + }, + { + "text": "the", + "start": 20.72, + "end": 20.88, + "confidence": 0.989 + }, + { + "text": "other", + "start": 20.88, + "end": 21.06, + "confidence": 0.991 + }, + { + "text": "one", + "start": 21.06, + "end": 21.26, + "confidence": 0.977 + }, + { + "text": "on", + "start": 21.26, + "end": 21.68, + "confidence": 0.989 + }, + { + "text": "the", + "start": 21.68, + "end": 21.96, + "confidence": 0.554 + 
}, + { + "text": "mic", + "start": 21.96, + "end": 22.58, + "confidence": 0.442 + }, + { + "text": "helmet", + "start": 22.58, + "end": 22.94, + "confidence": 0.842 + }, + { + "text": "with", + "start": 22.94, + "end": 23.2, + "confidence": 0.433 + }, + { + "text": "those", + "start": 23.2, + "end": 23.5, + "confidence": 0.471 + }, + { + "text": "GVA", + "start": 23.5, + "end": 23.88, + "confidence": 0.414 + }, + { + "text": "blizzard", + "start": 23.88, + "end": 24.32, + "confidence": 0.104 + }, + { + "text": "frames.", + "start": 24.32, + "end": 24.76, + "confidence": 0.25 + } + ] + }, + { + "id": 3, + "seek": 2500, + "start": 25.02, + "end": 55.0, + "text": " Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 2798, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 
658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.2, + "avg_logprob": -0.10773486667209202, + "compression_ratio": 24.096774193548388, + "no_speech_prob": 0.0012825782177969813, + "confidence": 0.936, + "words": [ + { + "text": "Alright,", + "start": 25.02, + "end": 31.98, + "confidence": 0.245 + }, + { + "text": "got", + "start": 31.98, + "end": 32.02, + "confidence": 0.356 + }, + { + "text": "them,", + "start": 32.02, + "end": 32.58, + "confidence": 0.323 + }, + { + "text": "got", + "start": 32.58, + "end": 33.08, + "confidence": 0.519 + }, + { + "text": "them,", + "start": 33.08, + "end": 33.78, + "confidence": 0.941 + }, + { + "text": "got", + "start": 33.78, + "end": 33.82, + "confidence": 0.507 + }, + { + "text": "them,", + "start": 33.82, + "end": 34.12, + "confidence": 0.926 + }, + { + "text": "got", + "start": 34.12, + "end": 34.16, + "confidence": 0.475 + }, + { + "text": "them,", + "start": 34.16, + "end": 34.92, + "confidence": 0.897 + }, + { + "text": "got", + "start": 34.92, + "end": 34.96, + "confidence": 0.597 + }, + { + "text": "them,", + "start": 34.96, + 
"end": 35.88, + "confidence": 0.914 + }, + { + "text": "got", + "start": 35.88, + "end": 35.92, + "confidence": 0.662 + }, + { + "text": "them,", + "start": 35.92, + "end": 35.96, + "confidence": 0.942 + }, + { + "text": "got", + "start": 35.96, + "end": 36.0, + "confidence": 0.738 + }, + { + "text": "them,", + "start": 36.0, + "end": 36.04, + "confidence": 0.963 + }, + { + "text": "got", + "start": 36.04, + "end": 36.08, + "confidence": 0.819 + }, + { + "text": "them,", + "start": 36.08, + "end": 36.12, + "confidence": 0.974 + }, + { + "text": "got", + "start": 36.12, + "end": 36.16, + "confidence": 0.843 + }, + { + "text": "them,", + "start": 36.16, + "end": 36.2, + "confidence": 0.981 + }, + { + "text": "got", + "start": 36.2, + "end": 36.24, + "confidence": 0.894 + }, + { + "text": "them,", + "start": 36.24, + "end": 36.28, + "confidence": 0.985 + }, + { + "text": "got", + "start": 36.28, + "end": 36.32, + "confidence": 0.918 + }, + { + "text": "them,", + "start": 36.32, + "end": 36.36, + "confidence": 0.987 + }, + { + "text": "got", + "start": 36.36, + "end": 36.4, + "confidence": 0.936 + }, + { + "text": "them,", + "start": 36.4, + "end": 36.44, + "confidence": 0.988 + }, + { + "text": "got", + "start": 36.44, + "end": 36.48, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 36.48, + "end": 36.52, + "confidence": 0.987 + }, + { + "text": "got", + "start": 36.52, + "end": 36.56, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 36.56, + "end": 36.6, + "confidence": 0.99 + }, + { + "text": "got", + "start": 36.6, + "end": 36.64, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 36.64, + "end": 36.68, + "confidence": 0.991 + }, + { + "text": "got", + "start": 36.68, + "end": 36.72, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 36.72, + "end": 36.76, + "confidence": 0.991 + }, + { + "text": "got", + "start": 36.76, + "end": 36.8, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 36.8, + "end": 36.84, + 
"confidence": 0.991 + }, + { + "text": "got", + "start": 36.84, + "end": 36.88, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 36.88, + "end": 36.92, + "confidence": 0.991 + }, + { + "text": "got", + "start": 36.92, + "end": 36.96, + "confidence": 0.948 + }, + { + "text": "them,", + "start": 36.96, + "end": 37.0, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.0, + "end": 37.04, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 37.04, + "end": 37.08, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.08, + "end": 37.12, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 37.12, + "end": 37.16, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.16, + "end": 37.2, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 37.2, + "end": 37.24, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.24, + "end": 37.28, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 37.28, + "end": 37.32, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.32, + "end": 37.36, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 37.36, + "end": 37.4, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.4, + "end": 37.44, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 37.44, + "end": 37.48, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.48, + "end": 37.52, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 37.52, + "end": 37.56, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.56, + "end": 37.6, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 37.6, + "end": 37.64, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.64, + "end": 37.68, + "confidence": 0.962 + }, + { + "text": "them,", + "start": 37.68, + "end": 37.72, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.72, + "end": 37.76, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 37.76, + "end": 37.8, + "confidence": 
0.993 + }, + { + "text": "got", + "start": 37.8, + "end": 37.84, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 37.84, + "end": 37.88, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.88, + "end": 37.92, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 37.92, + "end": 37.96, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.96, + "end": 38.0, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 38.0, + "end": 38.04, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.04, + "end": 38.08, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 38.08, + "end": 38.12, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.12, + "end": 38.16, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 38.16, + "end": 38.2, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.2, + "end": 38.24, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 38.24, + "end": 38.28, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.28, + "end": 38.32, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 38.32, + "end": 38.36, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.36, + "end": 38.4, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 38.4, + "end": 38.44, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.44, + "end": 38.48, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 38.48, + "end": 38.52, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.52, + "end": 38.56, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 38.56, + "end": 38.6, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.6, + "end": 38.64, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 38.64, + "end": 38.68, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.68, + "end": 38.72, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 38.72, + "end": 38.76, + "confidence": 0.994 + }, + { + 
"text": "got", + "start": 38.76, + "end": 38.8, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 38.8, + "end": 38.84, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.84, + "end": 38.88, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 38.88, + "end": 38.92, + "confidence": 0.995 + }, + { + "text": "got", + "start": 38.92, + "end": 38.96, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 38.96, + "end": 39.0, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.0, + "end": 39.04, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 39.04, + "end": 39.08, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.08, + "end": 39.12, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 39.12, + "end": 39.16, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.16, + "end": 39.2, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 39.2, + "end": 39.24, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.24, + "end": 39.28, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 39.28, + "end": 39.32, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.32, + "end": 39.36, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 39.36, + "end": 39.4, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.4, + "end": 39.44, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 39.44, + "end": 39.48, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.48, + "end": 39.52, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 39.52, + "end": 39.56, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.56, + "end": 39.6, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 39.6, + "end": 39.64, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.64, + "end": 39.68, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.68, + "end": 39.72, + "confidence": 0.995 + }, + { + "text": "got", + 
"start": 39.72, + "end": 39.76, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.76, + "end": 39.8, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.8, + "end": 39.84, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.84, + "end": 39.88, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.88, + "end": 39.92, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.92, + "end": 39.96, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.96, + "end": 40.0, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 40.0, + "end": 40.04, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.04, + "end": 40.08, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 40.08, + "end": 40.12, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.12, + "end": 40.16, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.16, + "end": 40.2, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.2, + "end": 40.24, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.24, + "end": 40.28, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.28, + "end": 40.32, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.32, + "end": 40.36, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.36, + "end": 40.4, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.4, + "end": 40.44, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.44, + "end": 40.48, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.48, + "end": 40.52, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.52, + "end": 40.56, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.56, + "end": 40.6, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.6, + "end": 40.64, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.64, + "end": 40.68, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.68, + 
"end": 40.72, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.72, + "end": 40.76, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.76, + "end": 40.8, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.8, + "end": 40.84, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.84, + "end": 40.88, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.88, + "end": 40.92, + "confidence": 0.996 + }, + { + "text": "got", + "start": 40.92, + "end": 40.96, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.96, + "end": 41.0, + "confidence": 0.996 + }, + { + "text": "got", + "start": 41.0, + "end": 41.04, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 41.04, + "end": 41.08, + "confidence": 0.996 + }, + { + "text": "got", + "start": 41.08, + "end": 41.12, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 41.12, + "end": 41.16, + "confidence": 0.996 + }, + { + "text": "got", + "start": 41.16, + "end": 41.2, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 41.2, + "end": 42.94, + "confidence": 0.996 + }, + { + "text": "got", + "start": 42.94, + "end": 46.82, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 46.82, + "end": 47.8, + "confidence": 0.996 + }, + { + "text": "got", + "start": 47.8, + "end": 48.58, + "confidence": 0.995 + }, + { + "text": "them", + "start": 48.58, + "end": 55.0, + "confidence": 0.997 + } + ] + }, + { + "id": 4, + "seek": 5500, + "start": 72.06, + "end": 85.0, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, 
got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.2, + "avg_logprob": -0.053046889369263245, + "compression_ratio": 29.52, + "no_speech_prob": 0.24410122632980347, + "confidence": 0.948, + "words": [ + { + "text": "got", + "start": 72.06, + "end": 72.1, + 
"confidence": 0.214 + }, + { + "text": "them,", + "start": 72.1, + "end": 72.14, + "confidence": 0.95 + }, + { + "text": "got", + "start": 72.14, + "end": 72.18, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 72.18, + "end": 72.22, + "confidence": 0.997 + }, + { + "text": "got", + "start": 72.22, + "end": 72.26, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 72.26, + "end": 72.3, + "confidence": 0.997 + }, + { + "text": "got", + "start": 72.3, + "end": 72.34, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 72.34, + "end": 72.38, + "confidence": 0.997 + }, + { + "text": "got", + "start": 72.38, + "end": 72.42, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 72.42, + "end": 72.46, + "confidence": 0.993 + }, + { + "text": "got", + "start": 72.46, + "end": 72.5, + "confidence": 0.912 + }, + { + "text": "them,", + "start": 72.5, + "end": 72.54, + "confidence": 0.988 + }, + { + "text": "got", + "start": 72.54, + "end": 72.58, + "confidence": 0.873 + }, + { + "text": "them,", + "start": 72.58, + "end": 72.62, + "confidence": 0.982 + }, + { + "text": "got", + "start": 72.62, + "end": 72.66, + "confidence": 0.863 + }, + { + "text": "them,", + "start": 72.66, + "end": 72.7, + "confidence": 0.984 + }, + { + "text": "got", + "start": 72.7, + "end": 72.74, + "confidence": 0.889 + }, + { + "text": "them,", + "start": 72.74, + "end": 72.78, + "confidence": 0.984 + }, + { + "text": "got", + "start": 72.78, + "end": 72.82, + "confidence": 0.852 + }, + { + "text": "them,", + "start": 72.82, + "end": 72.86, + "confidence": 0.925 + }, + { + "text": "got", + "start": 72.86, + "end": 72.9, + "confidence": 0.56 + }, + { + "text": "them,", + "start": 72.9, + "end": 72.94, + "confidence": 0.958 + }, + { + "text": "got", + "start": 72.94, + "end": 72.98, + "confidence": 0.81 + }, + { + "text": "them,", + "start": 72.98, + "end": 73.02, + "confidence": 0.976 + }, + { + "text": "got", + "start": 73.02, + "end": 73.06, + "confidence": 0.843 
+ }, + { + "text": "them,", + "start": 73.06, + "end": 73.1, + "confidence": 0.977 + }, + { + "text": "got", + "start": 73.1, + "end": 73.14, + "confidence": 0.835 + }, + { + "text": "them,", + "start": 73.14, + "end": 73.18, + "confidence": 0.977 + }, + { + "text": "got", + "start": 73.18, + "end": 73.22, + "confidence": 0.836 + }, + { + "text": "them,", + "start": 73.22, + "end": 73.26, + "confidence": 0.979 + }, + { + "text": "got", + "start": 73.26, + "end": 73.3, + "confidence": 0.853 + }, + { + "text": "them,", + "start": 73.3, + "end": 73.34, + "confidence": 0.983 + }, + { + "text": "got", + "start": 73.34, + "end": 73.38, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 73.38, + "end": 73.42, + "confidence": 0.986 + }, + { + "text": "got", + "start": 73.42, + "end": 73.46, + "confidence": 0.892 + }, + { + "text": "them,", + "start": 73.46, + "end": 73.5, + "confidence": 0.985 + }, + { + "text": "got", + "start": 73.5, + "end": 73.54, + "confidence": 0.885 + }, + { + "text": "them,", + "start": 73.54, + "end": 73.58, + "confidence": 0.986 + }, + { + "text": "got", + "start": 73.58, + "end": 73.62, + "confidence": 0.877 + }, + { + "text": "them,", + "start": 73.62, + "end": 73.66, + "confidence": 0.986 + }, + { + "text": "got", + "start": 73.66, + "end": 73.7, + "confidence": 0.873 + }, + { + "text": "them,", + "start": 73.7, + "end": 73.74, + "confidence": 0.987 + }, + { + "text": "got", + "start": 73.74, + "end": 73.78, + "confidence": 0.871 + }, + { + "text": "them,", + "start": 73.78, + "end": 73.82, + "confidence": 0.987 + }, + { + "text": "got", + "start": 73.82, + "end": 73.86, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 73.86, + "end": 73.9, + "confidence": 0.988 + }, + { + "text": "got", + "start": 73.9, + "end": 73.94, + "confidence": 0.883 + }, + { + "text": "them,", + "start": 73.94, + "end": 73.98, + "confidence": 0.989 + }, + { + "text": "got", + "start": 73.98, + "end": 74.02, + "confidence": 0.889 + }, + { + "text": 
"them,", + "start": 74.02, + "end": 74.06, + "confidence": 0.989 + }, + { + "text": "got", + "start": 74.06, + "end": 74.1, + "confidence": 0.895 + }, + { + "text": "them,", + "start": 74.1, + "end": 74.14, + "confidence": 0.99 + }, + { + "text": "got", + "start": 74.14, + "end": 74.18, + "confidence": 0.902 + }, + { + "text": "them,", + "start": 74.18, + "end": 74.22, + "confidence": 0.99 + }, + { + "text": "got", + "start": 74.22, + "end": 74.26, + "confidence": 0.905 + }, + { + "text": "them,", + "start": 74.26, + "end": 74.3, + "confidence": 0.991 + }, + { + "text": "got", + "start": 74.3, + "end": 74.34, + "confidence": 0.911 + }, + { + "text": "them,", + "start": 74.34, + "end": 74.38, + "confidence": 0.991 + }, + { + "text": "got", + "start": 74.38, + "end": 74.42, + "confidence": 0.916 + }, + { + "text": "them,", + "start": 74.42, + "end": 74.46, + "confidence": 0.991 + }, + { + "text": "got", + "start": 74.46, + "end": 74.5, + "confidence": 0.919 + }, + { + "text": "them,", + "start": 74.5, + "end": 74.54, + "confidence": 0.991 + }, + { + "text": "got", + "start": 74.54, + "end": 74.58, + "confidence": 0.922 + }, + { + "text": "them,", + "start": 74.58, + "end": 74.62, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.62, + "end": 74.66, + "confidence": 0.93 + }, + { + "text": "them,", + "start": 74.66, + "end": 74.7, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.7, + "end": 74.74, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 74.74, + "end": 74.78, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.78, + "end": 74.82, + "confidence": 0.937 + }, + { + "text": "them,", + "start": 74.82, + "end": 74.86, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.86, + "end": 74.9, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 74.9, + "end": 74.94, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.94, + "end": 74.98, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 
74.98, + "end": 75.02, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.02, + "end": 75.06, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 75.06, + "end": 75.1, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.1, + "end": 75.14, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 75.14, + "end": 75.18, + "confidence": 0.993 + }, + { + "text": "got", + "start": 75.18, + "end": 75.22, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 75.22, + "end": 75.26, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.26, + "end": 75.3, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 75.3, + "end": 75.34, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.34, + "end": 75.38, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 75.38, + "end": 75.42, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.42, + "end": 75.46, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 75.46, + "end": 75.5, + "confidence": 0.993 + }, + { + "text": "got", + "start": 75.5, + "end": 75.54, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 75.54, + "end": 75.58, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.58, + "end": 75.62, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 75.62, + "end": 75.66, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.66, + "end": 75.7, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 75.7, + "end": 75.74, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.74, + "end": 75.78, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 75.78, + "end": 75.82, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.82, + "end": 75.86, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 75.86, + "end": 75.9, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.9, + "end": 75.94, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 75.94, + "end": 
75.98, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.98, + "end": 76.02, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 76.02, + "end": 76.06, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.06, + "end": 76.1, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 76.1, + "end": 76.14, + "confidence": 0.993 + }, + { + "text": "got", + "start": 76.14, + "end": 76.18, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 76.18, + "end": 76.22, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.22, + "end": 76.26, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 76.26, + "end": 76.3, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.3, + "end": 76.34, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 76.34, + "end": 76.38, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.38, + "end": 76.42, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 76.42, + "end": 76.46, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.46, + "end": 76.5, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 76.5, + "end": 76.54, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.54, + "end": 76.58, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 76.58, + "end": 76.62, + "confidence": 0.993 + }, + { + "text": "got", + "start": 76.62, + "end": 76.66, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 76.66, + "end": 76.7, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.7, + "end": 76.74, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 76.74, + "end": 76.78, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.78, + "end": 76.82, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 76.82, + "end": 76.86, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.86, + "end": 76.9, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 76.9, + "end": 76.94, + 
"confidence": 0.992 + }, + { + "text": "got", + "start": 76.94, + "end": 76.98, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 76.98, + "end": 77.02, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.02, + "end": 77.06, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 77.06, + "end": 77.1, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.1, + "end": 77.14, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 77.14, + "end": 77.18, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.18, + "end": 77.22, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 77.22, + "end": 77.26, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.26, + "end": 77.3, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 77.3, + "end": 77.34, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.34, + "end": 77.38, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 77.38, + "end": 77.42, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.42, + "end": 77.46, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 77.46, + "end": 77.5, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.5, + "end": 77.54, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 77.54, + "end": 77.58, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.58, + "end": 77.62, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 77.62, + "end": 77.66, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.66, + "end": 77.7, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 77.7, + "end": 77.74, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.74, + "end": 77.78, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 77.78, + "end": 77.82, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.82, + "end": 77.86, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 77.86, + "end": 79.56, + "confidence": 
0.994 + }, + { + "text": "got", + "start": 79.56, + "end": 79.6, + "confidence": 0.981 + }, + { + "text": "them", + "start": 79.6, + "end": 85.0, + "confidence": 0.994 + } + ] + }, + { + "id": 5, + "seek": 8500, + "start": 85.02, + "end": 115.0, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 
11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.2, + "avg_logprob": -0.04965524716227578, + "compression_ratio": 29.52, + "no_speech_prob": 0.6971923112869263, + "confidence": 0.948, + "words": [ + { + "text": "got", + "start": 85.02, + "end": 85.46, + "confidence": 0.438 + }, + { + "text": "them,", + "start": 85.46, + "end": 86.26, + "confidence": 0.943 + }, + { + "text": "got", + "start": 86.26, + "end": 86.78, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 86.78, + "end": 87.18, + "confidence": 0.992 + }, + { + "text": "got", + "start": 87.18, + "end": 87.8, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 87.8, + "end": 87.84, + "confidence": 0.993 + }, + { + "text": "got", + "start": 87.84, + "end": 88.6, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 88.6, + "end": 88.64, + "confidence": 0.991 + }, + { + "text": "got", + "start": 88.64, + "end": 88.9, + "confidence": 0.934 + }, + { + "text": "them,", + "start": 88.9, + "end": 88.94, + "confidence": 0.988 + }, + { + "text": "got", + "start": 88.94, + "end": 88.98, + "confidence": 0.915 + }, + { + "text": "them,", + "start": 88.98, + "end": 89.02, + "confidence": 0.987 + }, + { + "text": "got", + "start": 89.02, + "end": 89.06, + "confidence": 0.9 + }, + { + "text": "them,", + "start": 89.06, + "end": 89.1, + "confidence": 0.985 + }, + { + "text": "got", + "start": 89.1, + "end": 89.14, + "confidence": 0.899 + }, + { + "text": "them,", + "start": 89.14, + "end": 89.18, + "confidence": 0.985 + }, + { + 
"text": "got", + "start": 89.18, + "end": 89.22, + "confidence": 0.907 + }, + { + "text": "them,", + "start": 89.22, + "end": 89.26, + "confidence": 0.982 + }, + { + "text": "got", + "start": 89.26, + "end": 89.3, + "confidence": 0.905 + }, + { + "text": "them,", + "start": 89.3, + "end": 89.34, + "confidence": 0.971 + }, + { + "text": "got", + "start": 89.34, + "end": 89.38, + "confidence": 0.866 + }, + { + "text": "them,", + "start": 89.38, + "end": 89.42, + "confidence": 0.959 + }, + { + "text": "got", + "start": 89.42, + "end": 89.46, + "confidence": 0.845 + }, + { + "text": "them,", + "start": 89.46, + "end": 89.5, + "confidence": 0.96 + }, + { + "text": "got", + "start": 89.5, + "end": 89.54, + "confidence": 0.861 + }, + { + "text": "them,", + "start": 89.54, + "end": 89.58, + "confidence": 0.963 + }, + { + "text": "got", + "start": 89.58, + "end": 89.62, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 89.62, + "end": 89.66, + "confidence": 0.965 + }, + { + "text": "got", + "start": 89.66, + "end": 89.7, + "confidence": 0.888 + }, + { + "text": "them,", + "start": 89.7, + "end": 89.74, + "confidence": 0.966 + }, + { + "text": "got", + "start": 89.74, + "end": 89.78, + "confidence": 0.887 + }, + { + "text": "them,", + "start": 89.78, + "end": 89.82, + "confidence": 0.966 + }, + { + "text": "got", + "start": 89.82, + "end": 89.86, + "confidence": 0.875 + }, + { + "text": "them,", + "start": 89.86, + "end": 89.9, + "confidence": 0.968 + }, + { + "text": "got", + "start": 89.9, + "end": 89.94, + "confidence": 0.871 + }, + { + "text": "them,", + "start": 89.94, + "end": 89.98, + "confidence": 0.968 + }, + { + "text": "got", + "start": 89.98, + "end": 90.02, + "confidence": 0.868 + }, + { + "text": "them,", + "start": 90.02, + "end": 90.06, + "confidence": 0.966 + }, + { + "text": "got", + "start": 90.06, + "end": 90.1, + "confidence": 0.865 + }, + { + "text": "them,", + "start": 90.1, + "end": 90.14, + "confidence": 0.964 + }, + { + "text": "got", + 
"start": 90.14, + "end": 90.18, + "confidence": 0.865 + }, + { + "text": "them,", + "start": 90.18, + "end": 90.22, + "confidence": 0.965 + }, + { + "text": "got", + "start": 90.22, + "end": 90.26, + "confidence": 0.86 + }, + { + "text": "them,", + "start": 90.26, + "end": 90.3, + "confidence": 0.965 + }, + { + "text": "got", + "start": 90.3, + "end": 90.34, + "confidence": 0.867 + }, + { + "text": "them,", + "start": 90.34, + "end": 90.38, + "confidence": 0.966 + }, + { + "text": "got", + "start": 90.38, + "end": 90.42, + "confidence": 0.866 + }, + { + "text": "them,", + "start": 90.42, + "end": 90.46, + "confidence": 0.967 + }, + { + "text": "got", + "start": 90.46, + "end": 90.5, + "confidence": 0.866 + }, + { + "text": "them,", + "start": 90.5, + "end": 90.54, + "confidence": 0.968 + }, + { + "text": "got", + "start": 90.54, + "end": 90.58, + "confidence": 0.87 + }, + { + "text": "them,", + "start": 90.58, + "end": 90.62, + "confidence": 0.969 + }, + { + "text": "got", + "start": 90.62, + "end": 90.66, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 90.66, + "end": 90.7, + "confidence": 0.971 + }, + { + "text": "got", + "start": 90.7, + "end": 90.74, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 90.74, + "end": 90.78, + "confidence": 0.971 + }, + { + "text": "got", + "start": 90.78, + "end": 90.82, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 90.82, + "end": 90.86, + "confidence": 0.971 + }, + { + "text": "got", + "start": 90.86, + "end": 90.9, + "confidence": 0.884 + }, + { + "text": "them,", + "start": 90.9, + "end": 90.94, + "confidence": 0.973 + }, + { + "text": "got", + "start": 90.94, + "end": 90.98, + "confidence": 0.883 + }, + { + "text": "them,", + "start": 90.98, + "end": 91.02, + "confidence": 0.973 + }, + { + "text": "got", + "start": 91.02, + "end": 91.06, + "confidence": 0.884 + }, + { + "text": "them,", + "start": 91.06, + "end": 91.1, + "confidence": 0.973 + }, + { + "text": "got", + "start": 91.1, + 
"end": 91.14, + "confidence": 0.893 + }, + { + "text": "them,", + "start": 91.14, + "end": 91.18, + "confidence": 0.975 + }, + { + "text": "got", + "start": 91.18, + "end": 91.22, + "confidence": 0.894 + }, + { + "text": "them,", + "start": 91.22, + "end": 91.26, + "confidence": 0.975 + }, + { + "text": "got", + "start": 91.26, + "end": 91.3, + "confidence": 0.9 + }, + { + "text": "them,", + "start": 91.3, + "end": 91.34, + "confidence": 0.976 + }, + { + "text": "got", + "start": 91.34, + "end": 91.38, + "confidence": 0.906 + }, + { + "text": "them,", + "start": 91.38, + "end": 91.42, + "confidence": 0.977 + }, + { + "text": "got", + "start": 91.42, + "end": 91.46, + "confidence": 0.905 + }, + { + "text": "them,", + "start": 91.46, + "end": 91.5, + "confidence": 0.978 + }, + { + "text": "got", + "start": 91.5, + "end": 91.54, + "confidence": 0.915 + }, + { + "text": "them,", + "start": 91.54, + "end": 91.58, + "confidence": 0.979 + }, + { + "text": "got", + "start": 91.58, + "end": 91.62, + "confidence": 0.92 + }, + { + "text": "them,", + "start": 91.62, + "end": 91.66, + "confidence": 0.98 + }, + { + "text": "got", + "start": 91.66, + "end": 91.7, + "confidence": 0.922 + }, + { + "text": "them,", + "start": 91.7, + "end": 91.74, + "confidence": 0.981 + }, + { + "text": "got", + "start": 91.74, + "end": 91.78, + "confidence": 0.925 + }, + { + "text": "them,", + "start": 91.78, + "end": 91.82, + "confidence": 0.982 + }, + { + "text": "got", + "start": 91.82, + "end": 91.86, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 91.86, + "end": 91.9, + "confidence": 0.983 + }, + { + "text": "got", + "start": 91.9, + "end": 91.94, + "confidence": 0.936 + }, + { + "text": "them,", + "start": 91.94, + "end": 91.98, + "confidence": 0.984 + }, + { + "text": "got", + "start": 91.98, + "end": 92.02, + "confidence": 0.935 + }, + { + "text": "them,", + "start": 92.02, + "end": 92.06, + "confidence": 0.985 + }, + { + "text": "got", + "start": 92.06, + "end": 92.1, + 
"confidence": 0.941 + }, + { + "text": "them,", + "start": 92.1, + "end": 92.14, + "confidence": 0.986 + }, + { + "text": "got", + "start": 92.14, + "end": 92.18, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 92.18, + "end": 92.22, + "confidence": 0.986 + }, + { + "text": "got", + "start": 92.22, + "end": 92.26, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 92.26, + "end": 92.3, + "confidence": 0.987 + }, + { + "text": "got", + "start": 92.3, + "end": 92.34, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 92.34, + "end": 92.38, + "confidence": 0.987 + }, + { + "text": "got", + "start": 92.38, + "end": 92.42, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 92.42, + "end": 92.46, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.46, + "end": 92.5, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 92.5, + "end": 92.54, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.54, + "end": 92.58, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 92.58, + "end": 92.62, + "confidence": 0.99 + }, + { + "text": "got", + "start": 92.62, + "end": 92.66, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 92.66, + "end": 92.7, + "confidence": 0.991 + }, + { + "text": "got", + "start": 92.7, + "end": 92.74, + "confidence": 0.966 + }, + { + "text": "them,", + "start": 92.74, + "end": 92.78, + "confidence": 0.992 + }, + { + "text": "got", + "start": 92.78, + "end": 92.82, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 92.82, + "end": 92.86, + "confidence": 0.992 + }, + { + "text": "got", + "start": 92.86, + "end": 92.9, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 92.9, + "end": 92.94, + "confidence": 0.992 + }, + { + "text": "got", + "start": 92.94, + "end": 92.98, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 92.98, + "end": 93.02, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.02, + "end": 93.06, + "confidence": 0.97 
+ }, + { + "text": "them,", + "start": 93.06, + "end": 93.1, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.1, + "end": 93.14, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 93.14, + "end": 93.18, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.18, + "end": 93.22, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 93.22, + "end": 93.26, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.26, + "end": 93.3, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 93.3, + "end": 93.34, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.34, + "end": 93.38, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 93.38, + "end": 93.42, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.42, + "end": 93.46, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 93.46, + "end": 93.5, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.5, + "end": 93.54, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 93.54, + "end": 93.58, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.58, + "end": 93.62, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 93.62, + "end": 93.66, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.66, + "end": 93.7, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 93.7, + "end": 93.74, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.74, + "end": 93.78, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 93.78, + "end": 93.82, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.82, + "end": 93.86, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 93.86, + "end": 93.9, + "confidence": 0.996 + }, + { + "text": "got", + "start": 93.9, + "end": 93.94, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 93.94, + "end": 93.98, + "confidence": 0.996 + }, + { + "text": "got", + "start": 93.98, + "end": 94.02, + "confidence": 0.984 + }, + { + "text": 
"them,", + "start": 94.02, + "end": 94.06, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.06, + "end": 94.1, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 94.1, + "end": 94.14, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.14, + "end": 94.18, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 94.18, + "end": 94.22, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.22, + "end": 94.26, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 94.26, + "end": 94.3, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.3, + "end": 94.34, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 94.34, + "end": 94.38, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.38, + "end": 94.42, + "confidence": 0.987 + }, + { + "text": "them", + "start": 94.42, + "end": 115.0, + "confidence": 0.996 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases.cpu/stucked_lm_apollo11.mp3.words.json b/tests/expected/corner_cases.cpu/stucked_lm_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..527def1f7142f05644333ecb9e358b7e067d0468 --- /dev/null +++ b/tests/expected/corner_cases.cpu/stucked_lm_apollo11.mp3.words.json @@ -0,0 +1,3814 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA. Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1. And you can put the other one on the mic helmet with those GVA blizzard frames. 
Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, 
got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.64, + "end": 6.94, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 20914, + 460, + 2634, + 15454, + 460, + 20914, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7224321867290296, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.542, + "words": [ + { + "text": "Apollo", + "start": 0.64, + "end": 0.98, + "confidence": 0.155 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.54, + "confidence": 0.977 + }, + { + "text": "Houston", + "start": 1.54, + "end": 1.8, + "confidence": 0.986 + }, + { + "text": "we", + "start": 1.8, + "end": 1.98, + "confidence": 0.52 + }, + { + "text": "got", + "start": 1.98, + "end": 2.16, + "confidence": 0.824 + }, + { + "text": "a", + "start": 2.16, + "end": 2.38, + "confidence": 0.989 + }, + { + "text": "recommendation", + "start": 2.38, + "end": 3.1, + "confidence": 0.968 + }, + { + "text": "for", + "start": 3.1, + "end": 3.52, + "confidence": 0.947 + }, + { + "text": "you", + "start": 3.52, + "end": 3.9, + "confidence": 0.984 + }, + { + "text": "on", + "start": 3.9, + "end": 4.28, + "confidence": 0.909 + }, + { + "text": "your", + "start": 4.28, + "end": 4.32, + "confidence": 0.971 + }, + { + "text": "Soyuz-VA", + "start": 4.32, + "end": 5.38, + "confidence": 0.26 + }, + { + "text": "GLEME", + "start": 5.38, + "end": 6.04, + "confidence": 0.478 + }, + { + "text": "GVA.", + "start": 6.04, + "end": 6.94, + "confidence": 0.436 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.82, + "end": 19.24, + "text": " Alright, okay, we 
like to say that they make the one that's on the helmet we're going to have in B1.", + "tokens": [ + 2798, + 11, + 1392, + 11, + 321, + 411, + 281, + 584, + 300, + 436, + 652, + 264, + 472, + 300, + 311, + 322, + 264, + 15922, + 321, + 434, + 516, + 281, + 362, + 294, + 363, + 16, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7224321867290296, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.468, + "words": [ + { + "text": "Alright,", + "start": 10.82, + "end": 12.5, + "confidence": 0.309 + }, + { + "text": "okay,", + "start": 12.5, + "end": 12.94, + "confidence": 0.507 + }, + { + "text": "we", + "start": 12.94, + "end": 13.12, + "confidence": 0.61 + }, + { + "text": "like", + "start": 13.12, + "end": 13.48, + "confidence": 0.503 + }, + { + "text": "to", + "start": 13.48, + "end": 13.68, + "confidence": 0.264 + }, + { + "text": "say", + "start": 13.68, + "end": 14.98, + "confidence": 0.138 + }, + { + "text": "that", + "start": 14.98, + "end": 15.56, + "confidence": 0.2 + }, + { + "text": "they", + "start": 15.56, + "end": 15.6, + "confidence": 0.418 + }, + { + "text": "make", + "start": 15.6, + "end": 15.76, + "confidence": 0.398 + }, + { + "text": "the", + "start": 15.76, + "end": 15.92, + "confidence": 0.253 + }, + { + "text": "one", + "start": 15.92, + "end": 16.1, + "confidence": 0.608 + }, + { + "text": "that's", + "start": 16.1, + "end": 16.34, + "confidence": 0.443 + }, + { + "text": "on", + "start": 16.34, + "end": 16.62, + "confidence": 0.595 + }, + { + "text": "the", + "start": 16.62, + "end": 16.96, + "confidence": 0.871 + }, + { + "text": "helmet", + "start": 16.96, + "end": 17.36, + "confidence": 0.853 + }, + { + "text": "we're", + "start": 17.36, + "end": 17.86, + "confidence": 0.299 + }, + { + "text": "going", + "start": 17.86, + "end": 18.06, + "confidence": 0.6 + }, + { + "text": "to", + "start": 18.06, + "end": 18.22, + "confidence": 0.818 + }, + { + "text": "have", + "start": 18.22, + 
"end": 18.26, + "confidence": 0.84 + }, + { + "text": "in", + "start": 18.26, + "end": 18.42, + "confidence": 0.717 + }, + { + "text": "B1.", + "start": 18.42, + "end": 19.24, + "confidence": 0.764 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 20.1, + "end": 24.76, + "text": " And you can put the other one on the mic helmet with those GVA blizzard frames.", + "tokens": [ + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 888, + 31062, + 12083, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7224321867290296, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.485, + "words": [ + { + "text": "And", + "start": 20.1, + "end": 20.24, + "confidence": 0.67 + }, + { + "text": "you", + "start": 20.24, + "end": 20.38, + "confidence": 0.947 + }, + { + "text": "can", + "start": 20.38, + "end": 20.54, + "confidence": 0.729 + }, + { + "text": "put", + "start": 20.54, + "end": 20.72, + "confidence": 0.98 + }, + { + "text": "the", + "start": 20.72, + "end": 20.88, + "confidence": 0.989 + }, + { + "text": "other", + "start": 20.88, + "end": 21.08, + "confidence": 0.991 + }, + { + "text": "one", + "start": 21.08, + "end": 21.26, + "confidence": 0.978 + }, + { + "text": "on", + "start": 21.26, + "end": 21.68, + "confidence": 0.989 + }, + { + "text": "the", + "start": 21.68, + "end": 21.96, + "confidence": 0.52 + }, + { + "text": "mic", + "start": 21.96, + "end": 22.58, + "confidence": 0.413 + }, + { + "text": "helmet", + "start": 22.58, + "end": 22.94, + "confidence": 0.882 + }, + { + "text": "with", + "start": 22.94, + "end": 23.2, + "confidence": 0.425 + }, + { + "text": "those", + "start": 23.2, + "end": 23.5, + "confidence": 0.465 + }, + { + "text": "GVA", + "start": 23.5, + "end": 23.88, + "confidence": 0.216 + }, + { + "text": "blizzard", + "start": 23.88, + "end": 24.32, + "confidence": 0.107 + }, + { + "text": "frames.", + "start": 24.32, + "end": 24.76, + 
"confidence": 0.254 + } + ] + }, + { + "id": 3, + "seek": 2500, + "start": 25.02, + "end": 55.0, + "text": " Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 2798, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 
658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.1079042222764757, + "compression_ratio": 24.096774193548388, + "no_speech_prob": 0.00111382023897022, + "confidence": 0.936, + "words": [ + { + "text": "Alright,", + "start": 25.02, + "end": 31.98, + "confidence": 0.213 + }, + { + "text": "got", + "start": 31.98, + "end": 32.02, + "confidence": 0.333 + }, + { + "text": "them,", + "start": 32.02, + "end": 32.58, + "confidence": 0.334 + }, + { + "text": "got", + "start": 32.58, + "end": 33.08, + "confidence": 0.526 + }, + { + "text": "them,", + "start": 33.08, + "end": 33.78, + "confidence": 0.942 + }, + { + "text": "got", + "start": 33.78, + "end": 33.82, + "confidence": 0.539 + }, + { + "text": "them,", + "start": 33.82, + "end": 34.18, + "confidence": 0.924 + }, + { + "text": "got", + "start": 34.18, + "end": 34.22, + "confidence": 0.48 + }, + { + "text": "them,", + "start": 34.22, + "end": 35.14, + "confidence": 0.907 + }, + { + "text": "got", + "start": 35.14, + "end": 35.18, + "confidence": 0.604 + }, + { + "text": "them,", + "start": 35.18, + "end": 35.22, + "confidence": 0.922 + }, + { + "text": "got", + "start": 35.22, + "end": 35.5, + "confidence": 0.661 + }, + { + "text": "them,", + "start": 35.5, + "end": 35.9, + "confidence": 0.948 + }, + { + "text": "got", + "start": 35.9, + "end": 35.94, + "confidence": 0.743 + }, + { + "text": "them,", + "start": 35.94, + "end": 35.98, + "confidence": 0.968 + }, + { + "text": "got", + "start": 35.98, + "end": 36.02, + "confidence": 0.825 + }, + { + "text": "them,", + "start": 36.02, + "end": 36.06, + "confidence": 0.975 + }, + { + "text": "got", + "start": 
36.06, + "end": 36.1, + "confidence": 0.839 + }, + { + "text": "them,", + "start": 36.1, + "end": 36.14, + "confidence": 0.981 + }, + { + "text": "got", + "start": 36.14, + "end": 36.18, + "confidence": 0.891 + }, + { + "text": "them,", + "start": 36.18, + "end": 36.22, + "confidence": 0.985 + }, + { + "text": "got", + "start": 36.22, + "end": 36.26, + "confidence": 0.919 + }, + { + "text": "them,", + "start": 36.26, + "end": 36.3, + "confidence": 0.987 + }, + { + "text": "got", + "start": 36.3, + "end": 36.34, + "confidence": 0.937 + }, + { + "text": "them,", + "start": 36.34, + "end": 36.38, + "confidence": 0.988 + }, + { + "text": "got", + "start": 36.38, + "end": 36.42, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 36.42, + "end": 36.46, + "confidence": 0.987 + }, + { + "text": "got", + "start": 36.46, + "end": 36.5, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 36.5, + "end": 36.54, + "confidence": 0.989 + }, + { + "text": "got", + "start": 36.54, + "end": 36.58, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 36.58, + "end": 36.62, + "confidence": 0.99 + }, + { + "text": "got", + "start": 36.62, + "end": 36.66, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 36.66, + "end": 36.7, + "confidence": 0.99 + }, + { + "text": "got", + "start": 36.7, + "end": 36.74, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 36.74, + "end": 36.78, + "confidence": 0.991 + }, + { + "text": "got", + "start": 36.78, + "end": 36.82, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 36.82, + "end": 36.86, + "confidence": 0.991 + }, + { + "text": "got", + "start": 36.86, + "end": 36.9, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 36.9, + "end": 36.94, + "confidence": 0.991 + }, + { + "text": "got", + "start": 36.94, + "end": 36.98, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 36.98, + "end": 37.02, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.02, + "end": 
37.06, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 37.06, + "end": 37.1, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.1, + "end": 37.14, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 37.14, + "end": 37.18, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.18, + "end": 37.22, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 37.22, + "end": 37.26, + "confidence": 0.992 + }, + { + "text": "got", + "start": 37.26, + "end": 37.3, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 37.3, + "end": 37.34, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.34, + "end": 37.38, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 37.38, + "end": 37.42, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.42, + "end": 37.46, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 37.46, + "end": 37.5, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.5, + "end": 37.54, + "confidence": 0.962 + }, + { + "text": "them,", + "start": 37.54, + "end": 37.58, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.58, + "end": 37.62, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 37.62, + "end": 37.66, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.66, + "end": 37.7, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 37.7, + "end": 37.74, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.74, + "end": 37.78, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 37.78, + "end": 37.82, + "confidence": 0.993 + }, + { + "text": "got", + "start": 37.82, + "end": 37.86, + "confidence": 0.966 + }, + { + "text": "them,", + "start": 37.86, + "end": 37.9, + "confidence": 0.994 + }, + { + "text": "got", + "start": 37.9, + "end": 37.94, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 37.94, + "end": 37.98, + "confidence": 0.994 + }, + { + "text": "got", + "start": 37.98, + "end": 38.02, + 
"confidence": 0.968 + }, + { + "text": "them,", + "start": 38.02, + "end": 38.06, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.06, + "end": 38.1, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 38.1, + "end": 38.14, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.14, + "end": 38.18, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 38.18, + "end": 38.22, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.22, + "end": 38.26, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 38.26, + "end": 38.3, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.3, + "end": 38.34, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 38.34, + "end": 38.38, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.38, + "end": 38.42, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 38.42, + "end": 38.46, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.46, + "end": 38.5, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 38.5, + "end": 38.54, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.54, + "end": 38.58, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 38.58, + "end": 38.62, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.62, + "end": 38.66, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 38.66, + "end": 38.7, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.7, + "end": 38.74, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 38.74, + "end": 38.78, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.78, + "end": 38.82, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 38.82, + "end": 38.86, + "confidence": 0.994 + }, + { + "text": "got", + "start": 38.86, + "end": 38.9, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 38.9, + "end": 38.94, + "confidence": 0.995 + }, + { + "text": "got", + "start": 38.94, + "end": 38.98, + "confidence": 0.984 
+ }, + { + "text": "them,", + "start": 38.98, + "end": 39.02, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.02, + "end": 39.06, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 39.06, + "end": 39.1, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.1, + "end": 39.14, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 39.14, + "end": 39.18, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.18, + "end": 39.22, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 39.22, + "end": 39.26, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.26, + "end": 39.3, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 39.3, + "end": 39.34, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.34, + "end": 39.38, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.38, + "end": 39.42, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.42, + "end": 39.46, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.46, + "end": 39.5, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.5, + "end": 39.54, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.54, + "end": 39.58, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.58, + "end": 39.62, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.62, + "end": 39.66, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.66, + "end": 39.7, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.7, + "end": 39.74, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.74, + "end": 39.78, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.78, + "end": 39.82, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.82, + "end": 39.86, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.86, + "end": 39.9, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.9, + "end": 39.94, + "confidence": 0.992 + }, + { + "text": 
"them,", + "start": 39.94, + "end": 39.98, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.98, + "end": 40.02, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.02, + "end": 40.06, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.06, + "end": 40.1, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.1, + "end": 40.14, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.14, + "end": 40.18, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.18, + "end": 40.22, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.22, + "end": 40.26, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.26, + "end": 40.3, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.3, + "end": 40.34, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.34, + "end": 40.38, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.38, + "end": 40.42, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.42, + "end": 40.46, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.46, + "end": 40.5, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.5, + "end": 40.54, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.54, + "end": 40.58, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.58, + "end": 40.62, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.62, + "end": 40.66, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.66, + "end": 40.7, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.7, + "end": 40.74, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 40.74, + "end": 40.78, + "confidence": 0.996 + }, + { + "text": "got", + "start": 40.78, + "end": 40.82, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 40.82, + "end": 40.86, + "confidence": 0.996 + }, + { + "text": "got", + "start": 40.86, + "end": 40.9, + "confidence": 0.995 + }, + { + "text": "them,", + 
"start": 40.9, + "end": 40.94, + "confidence": 0.996 + }, + { + "text": "got", + "start": 40.94, + "end": 40.98, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 40.98, + "end": 41.02, + "confidence": 0.996 + }, + { + "text": "got", + "start": 41.02, + "end": 41.06, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 41.06, + "end": 42.94, + "confidence": 0.996 + }, + { + "text": "got", + "start": 42.94, + "end": 46.82, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 46.82, + "end": 47.8, + "confidence": 0.996 + }, + { + "text": "got", + "start": 47.8, + "end": 48.58, + "confidence": 0.996 + }, + { + "text": "them,", + "start": 48.58, + "end": 50.82, + "confidence": 0.996 + }, + { + "text": "got", + "start": 50.82, + "end": 51.64, + "confidence": 0.996 + }, + { + "text": "them", + "start": 51.64, + "end": 55.0, + "confidence": 0.997 + } + ] + }, + { + "id": 4, + "seek": 5500, + "start": 72.06, + "end": 85.0, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, 
+ 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.053046889369263245, + "compression_ratio": 29.52, + "no_speech_prob": 0.24410122632980347, + "confidence": 0.948, + "words": [ + { + "text": "got", + "start": 72.06, + "end": 72.1, + "confidence": 0.214 + }, + { + "text": "them,", + "start": 72.1, + "end": 72.14, + "confidence": 0.95 + }, + { + "text": "got", + "start": 72.14, + "end": 72.18, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 72.18, + "end": 72.22, + "confidence": 0.997 + }, + { + "text": "got", + "start": 72.22, + "end": 72.26, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 72.26, + "end": 72.3, + "confidence": 0.997 + }, + { + "text": "got", + "start": 72.3, + "end": 72.34, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 72.34, + 
"end": 72.38, + "confidence": 0.997 + }, + { + "text": "got", + "start": 72.38, + "end": 72.42, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 72.42, + "end": 72.46, + "confidence": 0.993 + }, + { + "text": "got", + "start": 72.46, + "end": 72.5, + "confidence": 0.912 + }, + { + "text": "them,", + "start": 72.5, + "end": 72.54, + "confidence": 0.988 + }, + { + "text": "got", + "start": 72.54, + "end": 72.58, + "confidence": 0.873 + }, + { + "text": "them,", + "start": 72.58, + "end": 72.62, + "confidence": 0.982 + }, + { + "text": "got", + "start": 72.62, + "end": 72.66, + "confidence": 0.863 + }, + { + "text": "them,", + "start": 72.66, + "end": 72.7, + "confidence": 0.984 + }, + { + "text": "got", + "start": 72.7, + "end": 72.74, + "confidence": 0.889 + }, + { + "text": "them,", + "start": 72.74, + "end": 72.78, + "confidence": 0.984 + }, + { + "text": "got", + "start": 72.78, + "end": 72.82, + "confidence": 0.852 + }, + { + "text": "them,", + "start": 72.82, + "end": 72.86, + "confidence": 0.925 + }, + { + "text": "got", + "start": 72.86, + "end": 72.9, + "confidence": 0.56 + }, + { + "text": "them,", + "start": 72.9, + "end": 72.94, + "confidence": 0.958 + }, + { + "text": "got", + "start": 72.94, + "end": 72.98, + "confidence": 0.81 + }, + { + "text": "them,", + "start": 72.98, + "end": 73.02, + "confidence": 0.976 + }, + { + "text": "got", + "start": 73.02, + "end": 73.06, + "confidence": 0.843 + }, + { + "text": "them,", + "start": 73.06, + "end": 73.1, + "confidence": 0.977 + }, + { + "text": "got", + "start": 73.1, + "end": 73.14, + "confidence": 0.835 + }, + { + "text": "them,", + "start": 73.14, + "end": 73.18, + "confidence": 0.977 + }, + { + "text": "got", + "start": 73.18, + "end": 73.22, + "confidence": 0.836 + }, + { + "text": "them,", + "start": 73.22, + "end": 73.26, + "confidence": 0.979 + }, + { + "text": "got", + "start": 73.26, + "end": 73.3, + "confidence": 0.853 + }, + { + "text": "them,", + "start": 73.3, + "end": 73.34, + 
"confidence": 0.983 + }, + { + "text": "got", + "start": 73.34, + "end": 73.38, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 73.38, + "end": 73.42, + "confidence": 0.986 + }, + { + "text": "got", + "start": 73.42, + "end": 73.46, + "confidence": 0.892 + }, + { + "text": "them,", + "start": 73.46, + "end": 73.5, + "confidence": 0.985 + }, + { + "text": "got", + "start": 73.5, + "end": 73.54, + "confidence": 0.885 + }, + { + "text": "them,", + "start": 73.54, + "end": 73.58, + "confidence": 0.986 + }, + { + "text": "got", + "start": 73.58, + "end": 73.62, + "confidence": 0.877 + }, + { + "text": "them,", + "start": 73.62, + "end": 73.66, + "confidence": 0.986 + }, + { + "text": "got", + "start": 73.66, + "end": 73.7, + "confidence": 0.873 + }, + { + "text": "them,", + "start": 73.7, + "end": 73.74, + "confidence": 0.987 + }, + { + "text": "got", + "start": 73.74, + "end": 73.78, + "confidence": 0.871 + }, + { + "text": "them,", + "start": 73.78, + "end": 73.82, + "confidence": 0.987 + }, + { + "text": "got", + "start": 73.82, + "end": 73.86, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 73.86, + "end": 73.9, + "confidence": 0.988 + }, + { + "text": "got", + "start": 73.9, + "end": 73.94, + "confidence": 0.883 + }, + { + "text": "them,", + "start": 73.94, + "end": 73.98, + "confidence": 0.989 + }, + { + "text": "got", + "start": 73.98, + "end": 74.02, + "confidence": 0.889 + }, + { + "text": "them,", + "start": 74.02, + "end": 74.06, + "confidence": 0.989 + }, + { + "text": "got", + "start": 74.06, + "end": 74.1, + "confidence": 0.895 + }, + { + "text": "them,", + "start": 74.1, + "end": 74.14, + "confidence": 0.99 + }, + { + "text": "got", + "start": 74.14, + "end": 74.18, + "confidence": 0.902 + }, + { + "text": "them,", + "start": 74.18, + "end": 74.22, + "confidence": 0.99 + }, + { + "text": "got", + "start": 74.22, + "end": 74.26, + "confidence": 0.905 + }, + { + "text": "them,", + "start": 74.26, + "end": 74.3, + "confidence": 0.991 
+ }, + { + "text": "got", + "start": 74.3, + "end": 74.34, + "confidence": 0.911 + }, + { + "text": "them,", + "start": 74.34, + "end": 74.38, + "confidence": 0.991 + }, + { + "text": "got", + "start": 74.38, + "end": 74.42, + "confidence": 0.916 + }, + { + "text": "them,", + "start": 74.42, + "end": 74.46, + "confidence": 0.991 + }, + { + "text": "got", + "start": 74.46, + "end": 74.5, + "confidence": 0.919 + }, + { + "text": "them,", + "start": 74.5, + "end": 74.54, + "confidence": 0.991 + }, + { + "text": "got", + "start": 74.54, + "end": 74.58, + "confidence": 0.922 + }, + { + "text": "them,", + "start": 74.58, + "end": 74.62, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.62, + "end": 74.66, + "confidence": 0.93 + }, + { + "text": "them,", + "start": 74.66, + "end": 74.7, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.7, + "end": 74.74, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 74.74, + "end": 74.78, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.78, + "end": 74.82, + "confidence": 0.937 + }, + { + "text": "them,", + "start": 74.82, + "end": 74.86, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.86, + "end": 74.9, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 74.9, + "end": 74.94, + "confidence": 0.992 + }, + { + "text": "got", + "start": 74.94, + "end": 74.98, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 74.98, + "end": 75.02, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.02, + "end": 75.06, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 75.06, + "end": 75.1, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.1, + "end": 75.14, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 75.14, + "end": 75.18, + "confidence": 0.993 + }, + { + "text": "got", + "start": 75.18, + "end": 75.22, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 75.22, + "end": 75.26, + "confidence": 0.992 + }, + { + "text": 
"got", + "start": 75.26, + "end": 75.3, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 75.3, + "end": 75.34, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.34, + "end": 75.38, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 75.38, + "end": 75.42, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.42, + "end": 75.46, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 75.46, + "end": 75.5, + "confidence": 0.993 + }, + { + "text": "got", + "start": 75.5, + "end": 75.54, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 75.54, + "end": 75.58, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.58, + "end": 75.62, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 75.62, + "end": 75.66, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.66, + "end": 75.7, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 75.7, + "end": 75.74, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.74, + "end": 75.78, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 75.78, + "end": 75.82, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.82, + "end": 75.86, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 75.86, + "end": 75.9, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.9, + "end": 75.94, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 75.94, + "end": 75.98, + "confidence": 0.992 + }, + { + "text": "got", + "start": 75.98, + "end": 76.02, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 76.02, + "end": 76.06, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.06, + "end": 76.1, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 76.1, + "end": 76.14, + "confidence": 0.993 + }, + { + "text": "got", + "start": 76.14, + "end": 76.18, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 76.18, + "end": 76.22, + "confidence": 0.992 + }, + { + "text": "got", + "start": 
76.22, + "end": 76.26, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 76.26, + "end": 76.3, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.3, + "end": 76.34, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 76.34, + "end": 76.38, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.38, + "end": 76.42, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 76.42, + "end": 76.46, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.46, + "end": 76.5, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 76.5, + "end": 76.54, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.54, + "end": 76.58, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 76.58, + "end": 76.62, + "confidence": 0.993 + }, + { + "text": "got", + "start": 76.62, + "end": 76.66, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 76.66, + "end": 76.7, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.7, + "end": 76.74, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 76.74, + "end": 76.78, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.78, + "end": 76.82, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 76.82, + "end": 76.86, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.86, + "end": 76.9, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 76.9, + "end": 76.94, + "confidence": 0.992 + }, + { + "text": "got", + "start": 76.94, + "end": 76.98, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 76.98, + "end": 77.02, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.02, + "end": 77.06, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 77.06, + "end": 77.1, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.1, + "end": 77.14, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 77.14, + "end": 77.18, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.18, + "end": 
77.22, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 77.22, + "end": 77.26, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.26, + "end": 77.3, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 77.3, + "end": 77.34, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.34, + "end": 77.38, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 77.38, + "end": 77.42, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.42, + "end": 77.46, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 77.46, + "end": 77.5, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.5, + "end": 77.54, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 77.54, + "end": 77.58, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.58, + "end": 77.62, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 77.62, + "end": 77.66, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.66, + "end": 77.7, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 77.7, + "end": 77.74, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.74, + "end": 77.78, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 77.78, + "end": 77.82, + "confidence": 0.993 + }, + { + "text": "got", + "start": 77.82, + "end": 77.86, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 77.86, + "end": 79.56, + "confidence": 0.994 + }, + { + "text": "got", + "start": 79.56, + "end": 79.6, + "confidence": 0.981 + }, + { + "text": "them", + "start": 79.6, + "end": 85.0, + "confidence": 0.994 + } + ] + }, + { + "id": 5, + "seek": 8500, + "start": 85.02, + "end": 115.0, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got 
them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.04965524716227578, + 
"compression_ratio": 29.52, + "no_speech_prob": 0.6971923112869263, + "confidence": 0.948, + "words": [ + { + "text": "got", + "start": 85.02, + "end": 85.46, + "confidence": 0.438 + }, + { + "text": "them,", + "start": 85.46, + "end": 86.26, + "confidence": 0.943 + }, + { + "text": "got", + "start": 86.26, + "end": 86.78, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 86.78, + "end": 87.18, + "confidence": 0.992 + }, + { + "text": "got", + "start": 87.18, + "end": 87.8, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 87.8, + "end": 87.84, + "confidence": 0.993 + }, + { + "text": "got", + "start": 87.84, + "end": 88.6, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 88.6, + "end": 88.64, + "confidence": 0.991 + }, + { + "text": "got", + "start": 88.64, + "end": 88.9, + "confidence": 0.934 + }, + { + "text": "them,", + "start": 88.9, + "end": 88.94, + "confidence": 0.988 + }, + { + "text": "got", + "start": 88.94, + "end": 88.98, + "confidence": 0.915 + }, + { + "text": "them,", + "start": 88.98, + "end": 89.02, + "confidence": 0.987 + }, + { + "text": "got", + "start": 89.02, + "end": 89.06, + "confidence": 0.9 + }, + { + "text": "them,", + "start": 89.06, + "end": 89.1, + "confidence": 0.985 + }, + { + "text": "got", + "start": 89.1, + "end": 89.14, + "confidence": 0.899 + }, + { + "text": "them,", + "start": 89.14, + "end": 89.18, + "confidence": 0.985 + }, + { + "text": "got", + "start": 89.18, + "end": 89.22, + "confidence": 0.907 + }, + { + "text": "them,", + "start": 89.22, + "end": 89.26, + "confidence": 0.982 + }, + { + "text": "got", + "start": 89.26, + "end": 89.3, + "confidence": 0.905 + }, + { + "text": "them,", + "start": 89.3, + "end": 89.34, + "confidence": 0.971 + }, + { + "text": "got", + "start": 89.34, + "end": 89.38, + "confidence": 0.866 + }, + { + "text": "them,", + "start": 89.38, + "end": 89.42, + "confidence": 0.959 + }, + { + "text": "got", + "start": 89.42, + "end": 89.46, + "confidence": 0.845 + }, 
+ { + "text": "them,", + "start": 89.46, + "end": 89.5, + "confidence": 0.96 + }, + { + "text": "got", + "start": 89.5, + "end": 89.54, + "confidence": 0.861 + }, + { + "text": "them,", + "start": 89.54, + "end": 89.58, + "confidence": 0.963 + }, + { + "text": "got", + "start": 89.58, + "end": 89.62, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 89.62, + "end": 89.66, + "confidence": 0.965 + }, + { + "text": "got", + "start": 89.66, + "end": 89.7, + "confidence": 0.888 + }, + { + "text": "them,", + "start": 89.7, + "end": 89.74, + "confidence": 0.966 + }, + { + "text": "got", + "start": 89.74, + "end": 89.78, + "confidence": 0.887 + }, + { + "text": "them,", + "start": 89.78, + "end": 89.82, + "confidence": 0.966 + }, + { + "text": "got", + "start": 89.82, + "end": 89.86, + "confidence": 0.875 + }, + { + "text": "them,", + "start": 89.86, + "end": 89.9, + "confidence": 0.968 + }, + { + "text": "got", + "start": 89.9, + "end": 89.94, + "confidence": 0.871 + }, + { + "text": "them,", + "start": 89.94, + "end": 89.98, + "confidence": 0.968 + }, + { + "text": "got", + "start": 89.98, + "end": 90.02, + "confidence": 0.868 + }, + { + "text": "them,", + "start": 90.02, + "end": 90.06, + "confidence": 0.966 + }, + { + "text": "got", + "start": 90.06, + "end": 90.1, + "confidence": 0.865 + }, + { + "text": "them,", + "start": 90.1, + "end": 90.14, + "confidence": 0.964 + }, + { + "text": "got", + "start": 90.14, + "end": 90.18, + "confidence": 0.865 + }, + { + "text": "them,", + "start": 90.18, + "end": 90.22, + "confidence": 0.965 + }, + { + "text": "got", + "start": 90.22, + "end": 90.26, + "confidence": 0.86 + }, + { + "text": "them,", + "start": 90.26, + "end": 90.3, + "confidence": 0.965 + }, + { + "text": "got", + "start": 90.3, + "end": 90.34, + "confidence": 0.867 + }, + { + "text": "them,", + "start": 90.34, + "end": 90.38, + "confidence": 0.966 + }, + { + "text": "got", + "start": 90.38, + "end": 90.42, + "confidence": 0.866 + }, + { + "text": 
"them,", + "start": 90.42, + "end": 90.46, + "confidence": 0.967 + }, + { + "text": "got", + "start": 90.46, + "end": 90.5, + "confidence": 0.866 + }, + { + "text": "them,", + "start": 90.5, + "end": 90.54, + "confidence": 0.968 + }, + { + "text": "got", + "start": 90.54, + "end": 90.58, + "confidence": 0.87 + }, + { + "text": "them,", + "start": 90.58, + "end": 90.62, + "confidence": 0.969 + }, + { + "text": "got", + "start": 90.62, + "end": 90.66, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 90.66, + "end": 90.7, + "confidence": 0.971 + }, + { + "text": "got", + "start": 90.7, + "end": 90.74, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 90.74, + "end": 90.78, + "confidence": 0.971 + }, + { + "text": "got", + "start": 90.78, + "end": 90.82, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 90.82, + "end": 90.86, + "confidence": 0.971 + }, + { + "text": "got", + "start": 90.86, + "end": 90.9, + "confidence": 0.884 + }, + { + "text": "them,", + "start": 90.9, + "end": 90.94, + "confidence": 0.973 + }, + { + "text": "got", + "start": 90.94, + "end": 90.98, + "confidence": 0.883 + }, + { + "text": "them,", + "start": 90.98, + "end": 91.02, + "confidence": 0.973 + }, + { + "text": "got", + "start": 91.02, + "end": 91.06, + "confidence": 0.884 + }, + { + "text": "them,", + "start": 91.06, + "end": 91.1, + "confidence": 0.973 + }, + { + "text": "got", + "start": 91.1, + "end": 91.14, + "confidence": 0.893 + }, + { + "text": "them,", + "start": 91.14, + "end": 91.18, + "confidence": 0.975 + }, + { + "text": "got", + "start": 91.18, + "end": 91.22, + "confidence": 0.894 + }, + { + "text": "them,", + "start": 91.22, + "end": 91.26, + "confidence": 0.975 + }, + { + "text": "got", + "start": 91.26, + "end": 91.3, + "confidence": 0.9 + }, + { + "text": "them,", + "start": 91.3, + "end": 91.34, + "confidence": 0.976 + }, + { + "text": "got", + "start": 91.34, + "end": 91.38, + "confidence": 0.906 + }, + { + "text": "them,", + "start": 
91.38, + "end": 91.42, + "confidence": 0.977 + }, + { + "text": "got", + "start": 91.42, + "end": 91.46, + "confidence": 0.905 + }, + { + "text": "them,", + "start": 91.46, + "end": 91.5, + "confidence": 0.978 + }, + { + "text": "got", + "start": 91.5, + "end": 91.54, + "confidence": 0.915 + }, + { + "text": "them,", + "start": 91.54, + "end": 91.58, + "confidence": 0.979 + }, + { + "text": "got", + "start": 91.58, + "end": 91.62, + "confidence": 0.92 + }, + { + "text": "them,", + "start": 91.62, + "end": 91.66, + "confidence": 0.98 + }, + { + "text": "got", + "start": 91.66, + "end": 91.7, + "confidence": 0.922 + }, + { + "text": "them,", + "start": 91.7, + "end": 91.74, + "confidence": 0.981 + }, + { + "text": "got", + "start": 91.74, + "end": 91.78, + "confidence": 0.925 + }, + { + "text": "them,", + "start": 91.78, + "end": 91.82, + "confidence": 0.982 + }, + { + "text": "got", + "start": 91.82, + "end": 91.86, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 91.86, + "end": 91.9, + "confidence": 0.983 + }, + { + "text": "got", + "start": 91.9, + "end": 91.94, + "confidence": 0.936 + }, + { + "text": "them,", + "start": 91.94, + "end": 91.98, + "confidence": 0.984 + }, + { + "text": "got", + "start": 91.98, + "end": 92.02, + "confidence": 0.935 + }, + { + "text": "them,", + "start": 92.02, + "end": 92.06, + "confidence": 0.985 + }, + { + "text": "got", + "start": 92.06, + "end": 92.1, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 92.1, + "end": 92.14, + "confidence": 0.986 + }, + { + "text": "got", + "start": 92.14, + "end": 92.18, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 92.18, + "end": 92.22, + "confidence": 0.986 + }, + { + "text": "got", + "start": 92.22, + "end": 92.26, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 92.26, + "end": 92.3, + "confidence": 0.987 + }, + { + "text": "got", + "start": 92.3, + "end": 92.34, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 92.34, + "end": 
92.38, + "confidence": 0.987 + }, + { + "text": "got", + "start": 92.38, + "end": 92.42, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 92.42, + "end": 92.46, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.46, + "end": 92.5, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 92.5, + "end": 92.54, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.54, + "end": 92.58, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 92.58, + "end": 92.62, + "confidence": 0.99 + }, + { + "text": "got", + "start": 92.62, + "end": 92.66, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 92.66, + "end": 92.7, + "confidence": 0.991 + }, + { + "text": "got", + "start": 92.7, + "end": 92.74, + "confidence": 0.966 + }, + { + "text": "them,", + "start": 92.74, + "end": 92.78, + "confidence": 0.992 + }, + { + "text": "got", + "start": 92.78, + "end": 92.82, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 92.82, + "end": 92.86, + "confidence": 0.992 + }, + { + "text": "got", + "start": 92.86, + "end": 92.9, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 92.9, + "end": 92.94, + "confidence": 0.992 + }, + { + "text": "got", + "start": 92.94, + "end": 92.98, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 92.98, + "end": 93.02, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.02, + "end": 93.06, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 93.06, + "end": 93.1, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.1, + "end": 93.14, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 93.14, + "end": 93.18, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.18, + "end": 93.22, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 93.22, + "end": 93.26, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.26, + "end": 93.3, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 93.3, + "end": 93.34, + 
"confidence": 0.994 + }, + { + "text": "got", + "start": 93.34, + "end": 93.38, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 93.38, + "end": 93.42, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.42, + "end": 93.46, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 93.46, + "end": 93.5, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.5, + "end": 93.54, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 93.54, + "end": 93.58, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.58, + "end": 93.62, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 93.62, + "end": 93.66, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.66, + "end": 93.7, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 93.7, + "end": 93.74, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.74, + "end": 93.78, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 93.78, + "end": 93.82, + "confidence": 0.995 + }, + { + "text": "got", + "start": 93.82, + "end": 93.86, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 93.86, + "end": 93.9, + "confidence": 0.996 + }, + { + "text": "got", + "start": 93.9, + "end": 93.94, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 93.94, + "end": 93.98, + "confidence": 0.996 + }, + { + "text": "got", + "start": 93.98, + "end": 94.02, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 94.02, + "end": 94.06, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.06, + "end": 94.1, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 94.1, + "end": 94.14, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.14, + "end": 94.18, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 94.18, + "end": 94.22, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.22, + "end": 94.26, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 94.26, + "end": 94.3, + "confidence": 
0.996 + }, + { + "text": "got", + "start": 94.3, + "end": 94.34, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 94.34, + "end": 94.38, + "confidence": 0.996 + }, + { + "text": "got", + "start": 94.38, + "end": 94.42, + "confidence": 0.987 + }, + { + "text": "them", + "start": 94.42, + "end": 115.0, + "confidence": 0.996 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/accurate.tiny_apollo11.mp3.words.json b/tests/expected/corner_cases/accurate.tiny_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..7ad6577bcc1c1e5d972ee3a7a905627ce5e41386 --- /dev/null +++ b/tests/expected/corner_cases/accurate.tiny_apollo11.mp3.words.json @@ -0,0 +1,1261 @@ +{ + "text": " I'm all around my business and we got a recommendation for you on your door to the VA We have 18A's Okay, okay, I think I'll just get him or if they like just want to go on the Yeah, now what you want is on having a B1 And you just get the other one on my Now when we're here, we're going to go on the Yeah Okay, we want to hear that This is it, we know we just You can hit that That's how much you've ordered in that So I guess I'm working on my position but it's not Oh my god Okay, no problem No idea No idea Okay Okay", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.6, + "end": 5.36, + "text": " I'm all around my business and we got a recommendation for you on your door to the VA", + "tokens": [ + 50364, + 286, + 478, + 439, + 926, + 452, + 1606, + 293, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 2853, + 281, + 264, + 18527, + 50628 + ], + "temperature": 0.0, + "avg_logprob": -1.1827944879946501, + "compression_ratio": 1.52020202020202, + "no_speech_prob": 0.35403239727020264, + "confidence": 0.324, + "words": [ + { + "text": "I'm", + "start": 0.6, + "end": 0.82, + "confidence": 0.168 + }, + { + "text": "all", + "start": 0.82, + "end": 1.06, + "confidence": 0.082 + }, + { + 
"text": "around", + "start": 1.06, + "end": 1.28, + "confidence": 0.104 + }, + { + "text": "my", + "start": 1.28, + "end": 1.46, + "confidence": 0.128 + }, + { + "text": "business", + "start": 1.46, + "end": 1.72, + "confidence": 0.342 + }, + { + "text": "and", + "start": 1.72, + "end": 1.92, + "confidence": 0.613 + }, + { + "text": "we", + "start": 1.92, + "end": 1.98, + "confidence": 0.937 + }, + { + "text": "got", + "start": 1.98, + "end": 2.18, + "confidence": 0.4 + }, + { + "text": "a", + "start": 2.18, + "end": 2.4, + "confidence": 0.639 + }, + { + "text": "recommendation", + "start": 2.4, + "end": 3.06, + "confidence": 0.599 + }, + { + "text": "for", + "start": 3.06, + "end": 3.5, + "confidence": 0.371 + }, + { + "text": "you", + "start": 3.5, + "end": 3.68, + "confidence": 0.974 + }, + { + "text": "on", + "start": 3.68, + "end": 3.88, + "confidence": 0.805 + }, + { + "text": "your", + "start": 3.88, + "end": 4.24, + "confidence": 0.562 + }, + { + "text": "door", + "start": 4.24, + "end": 4.68, + "confidence": 0.145 + }, + { + "text": "to", + "start": 4.68, + "end": 4.88, + "confidence": 0.182 + }, + { + "text": "the", + "start": 4.88, + "end": 5.08, + "confidence": 0.501 + }, + { + "text": "VA", + "start": 5.08, + "end": 5.36, + "confidence": 0.249 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 5.36, + "end": 6.94, + "text": " We have 18A's", + "tokens": [ + 50628, + 492, + 362, + 2443, + 32, + 311, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -1.1827944879946501, + "compression_ratio": 1.52020202020202, + "no_speech_prob": 0.35403239727020264, + "confidence": 0.175, + "words": [ + { + "text": "We", + "start": 5.36, + "end": 5.74, + "confidence": 0.042 + }, + { + "text": "have", + "start": 5.74, + "end": 5.76, + "confidence": 0.652 + }, + { + "text": "18A's", + "start": 5.76, + "end": 6.94, + "confidence": 0.182 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 12.0, + "end": 16.79, + "text": " Okay, okay, I think I'll just get him or if they 
like just want to go on the", + "tokens": [ + 50914, + 1033, + 11, + 1392, + 11, + 286, + 519, + 286, + 603, + 445, + 483, + 796, + 420, + 498, + 436, + 411, + 445, + 528, + 281, + 352, + 322, + 264, + 51197 + ], + "temperature": 0.0, + "avg_logprob": -1.1827944879946501, + "compression_ratio": 1.52020202020202, + "no_speech_prob": 0.35403239727020264, + "confidence": 0.327, + "words": [ + { + "text": "Okay,", + "start": 12.0, + "end": 12.38, + "confidence": 0.662 + }, + { + "text": "okay,", + "start": 12.88, + "end": 13.12, + "confidence": 0.291 + }, + { + "text": "I", + "start": 13.12, + "end": 13.3, + "confidence": 0.209 + }, + { + "text": "think", + "start": 13.3, + "end": 13.58, + "confidence": 0.263 + }, + { + "text": "I'll", + "start": 13.58, + "end": 13.9, + "confidence": 0.2 + }, + { + "text": "just", + "start": 13.9, + "end": 14.1, + "confidence": 0.17 + }, + { + "text": "get", + "start": 14.1, + "end": 14.28, + "confidence": 0.248 + }, + { + "text": "him", + "start": 14.28, + "end": 14.52, + "confidence": 0.153 + }, + { + "text": "or", + "start": 14.52, + "end": 14.74, + "confidence": 0.199 + }, + { + "text": "if", + "start": 14.74, + "end": 14.94, + "confidence": 0.088 + }, + { + "text": "they", + "start": 14.94, + "end": 15.44, + "confidence": 0.607 + }, + { + "text": "like", + "start": 15.44, + "end": 15.74, + "confidence": 0.2 + }, + { + "text": "just", + "start": 15.74, + "end": 15.96, + "confidence": 0.462 + }, + { + "text": "want", + "start": 15.96, + "end": 16.18, + "confidence": 0.765 + }, + { + "text": "to", + "start": 16.18, + "end": 16.36, + "confidence": 0.91 + }, + { + "text": "go", + "start": 16.36, + "end": 16.56, + "confidence": 0.948 + }, + { + "text": "on", + "start": 16.56, + "end": 16.7, + "confidence": 0.566 + }, + { + "text": "the", + "start": 16.7, + "end": 16.79, + "confidence": 0.585 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 16.79, + "end": 19.0, + "text": " Yeah, now what you want is on having a B1", + "tokens": [ + 
51197, + 865, + 11, + 586, + 437, + 291, + 528, + 307, + 322, + 1419, + 257, + 363, + 16, + 51322 + ], + "temperature": 0.0, + "avg_logprob": -1.1827944879946501, + "compression_ratio": 1.52020202020202, + "no_speech_prob": 0.35403239727020264, + "confidence": 0.471, + "words": [ + { + "text": "Yeah,", + "start": 16.79, + "end": 17.1, + "confidence": 0.28 + }, + { + "text": "now", + "start": 17.18, + "end": 17.3, + "confidence": 0.365 + }, + { + "text": "what", + "start": 17.3, + "end": 17.48, + "confidence": 0.743 + }, + { + "text": "you", + "start": 17.48, + "end": 17.62, + "confidence": 0.932 + }, + { + "text": "want", + "start": 17.62, + "end": 17.84, + "confidence": 0.743 + }, + { + "text": "is", + "start": 17.84, + "end": 17.96, + "confidence": 0.674 + }, + { + "text": "on", + "start": 17.96, + "end": 18.16, + "confidence": 0.327 + }, + { + "text": "having", + "start": 18.16, + "end": 18.44, + "confidence": 0.563 + }, + { + "text": "a", + "start": 18.44, + "end": 18.76, + "confidence": 0.287 + }, + { + "text": "B1", + "start": 18.76, + "end": 19.0, + "confidence": 0.37 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 19.0, + "end": 21.88, + "text": " And you just get the other one on my", + "tokens": [ + 51322, + 400, + 291, + 445, + 483, + 264, + 661, + 472, + 322, + 452, + 51462 + ], + "temperature": 0.0, + "avg_logprob": -1.1827944879946501, + "compression_ratio": 1.52020202020202, + "no_speech_prob": 0.35403239727020264, + "confidence": 0.516, + "words": [ + { + "text": "And", + "start": 19.0, + "end": 20.26, + "confidence": 0.272 + }, + { + "text": "you", + "start": 20.26, + "end": 20.4, + "confidence": 0.846 + }, + { + "text": "just", + "start": 20.4, + "end": 20.64, + "confidence": 0.694 + }, + { + "text": "get", + "start": 20.64, + "end": 20.8, + "confidence": 0.134 + }, + { + "text": "the", + "start": 20.8, + "end": 20.9, + "confidence": 0.65 + }, + { + "text": "other", + "start": 20.9, + "end": 21.08, + "confidence": 0.937 + }, + { + "text": 
"one", + "start": 21.08, + "end": 21.26, + "confidence": 0.976 + }, + { + "text": "on", + "start": 21.26, + "end": 21.66, + "confidence": 0.872 + }, + { + "text": "my", + "start": 21.66, + "end": 21.88, + "confidence": 0.232 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 22.12, + "end": 25.36, + "text": " Now when we're here, we're going to go on the", + "tokens": [ + 51462, + 823, + 562, + 321, + 434, + 510, + 11, + 321, + 434, + 516, + 281, + 352, + 322, + 264, + 51616 + ], + "temperature": 0.0, + "avg_logprob": -1.1827944879946501, + "compression_ratio": 1.52020202020202, + "no_speech_prob": 0.35403239727020264, + "confidence": 0.336, + "words": [ + { + "text": "Now", + "start": 22.12, + "end": 22.8, + "confidence": 0.168 + }, + { + "text": "when", + "start": 22.8, + "end": 23.04, + "confidence": 0.35 + }, + { + "text": "we're", + "start": 23.04, + "end": 23.24, + "confidence": 0.745 + }, + { + "text": "here,", + "start": 23.24, + "end": 23.44, + "confidence": 0.492 + }, + { + "text": "we're", + "start": 23.66, + "end": 23.88, + "confidence": 0.293 + }, + { + "text": "going", + "start": 23.88, + "end": 23.94, + "confidence": 0.291 + }, + { + "text": "to", + "start": 23.94, + "end": 24.38, + "confidence": 0.88 + }, + { + "text": "go", + "start": 24.38, + "end": 24.72, + "confidence": 0.119 + }, + { + "text": "on", + "start": 24.72, + "end": 25.34, + "confidence": 0.133 + }, + { + "text": "the", + "start": 25.34, + "end": 25.36, + "confidence": 0.364 + } + ] + }, + { + "id": 6, + "seek": 3000, + "start": 31.36, + "end": 31.56, + "text": " Yeah", + "tokens": [ + 50364, + 865, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -1.6116297245025635, + "compression_ratio": 0.3333333333333333, + "no_speech_prob": 0.29405874013900757, + "confidence": 0.057, + "words": [ + { + "text": "Yeah", + "start": 31.36, + "end": 31.56, + "confidence": 0.057 + } + ] + }, + { + "id": 7, + "seek": 6000, + "start": 62.7, + "end": 64.14, + "text": " Okay, we want to hear that", + 
"tokens": [ + 50364, + 1033, + 11, + 321, + 528, + 281, + 1568, + 300, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.355, + "words": [ + { + "text": "Okay,", + "start": 62.7, + "end": 62.72, + "confidence": 0.125 + }, + { + "text": "we", + "start": 63.1, + "end": 63.32, + "confidence": 0.238 + }, + { + "text": "want", + "start": 63.32, + "end": 63.62, + "confidence": 0.529 + }, + { + "text": "to", + "start": 63.62, + "end": 63.72, + "confidence": 0.571 + }, + { + "text": "hear", + "start": 63.72, + "end": 63.84, + "confidence": 0.245 + }, + { + "text": "that", + "start": 63.84, + "end": 64.14, + "confidence": 0.92 + } + ] + }, + { + "id": 8, + "seek": 6000, + "start": 64.46, + "end": 66.82, + "text": " This is it, we know we just", + "tokens": [ + 50564, + 639, + 307, + 309, + 11, + 321, + 458, + 321, + 445, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.459, + "words": [ + { + "text": "This", + "start": 64.46, + "end": 64.72, + "confidence": 0.243 + }, + { + "text": "is", + "start": 64.72, + "end": 64.94, + "confidence": 0.663 + }, + { + "text": "it,", + "start": 64.94, + "end": 65.12, + "confidence": 0.243 + }, + { + "text": "we", + "start": 65.22, + "end": 65.42, + "confidence": 0.475 + }, + { + "text": "know", + "start": 65.42, + "end": 65.62, + "confidence": 0.696 + }, + { + "text": "we", + "start": 65.62, + "end": 65.88, + "confidence": 0.823 + }, + { + "text": "just", + "start": 65.88, + "end": 66.82, + "confidence": 0.405 + } + ] + }, + { + "id": 9, + "seek": 6000, + "start": 66.86, + "end": 68.3, + "text": " You can hit that", + "tokens": [ + 50714, + 509, + 393, + 2045, + 300, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + 
"no_speech_prob": 0.10345567017793655, + "confidence": 0.329, + "words": [ + { + "text": "You", + "start": 66.86, + "end": 67.14, + "confidence": 0.246 + }, + { + "text": "can", + "start": 67.14, + "end": 67.32, + "confidence": 0.577 + }, + { + "text": "hit", + "start": 67.32, + "end": 67.52, + "confidence": 0.126 + }, + { + "text": "that", + "start": 67.52, + "end": 68.3, + "confidence": 0.656 + } + ] + }, + { + "id": 10, + "seek": 6000, + "start": 68.32, + "end": 69.46, + "text": " That's how much you've ordered in that", + "tokens": [ + 50764, + 663, + 311, + 577, + 709, + 291, + 600, + 8866, + 294, + 300, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.3, + "words": [ + { + "text": "That's", + "start": 68.32, + "end": 68.58, + "confidence": 0.262 + }, + { + "text": "how", + "start": 68.58, + "end": 68.6, + "confidence": 0.237 + }, + { + "text": "much", + "start": 68.6, + "end": 68.68, + "confidence": 0.974 + }, + { + "text": "you've", + "start": 68.68, + "end": 68.84, + "confidence": 0.416 + }, + { + "text": "ordered", + "start": 68.84, + "end": 69.02, + "confidence": 0.145 + }, + { + "text": "in", + "start": 69.02, + "end": 69.22, + "confidence": 0.204 + }, + { + "text": "that", + "start": 69.22, + "end": 69.46, + "confidence": 0.246 + } + ] + }, + { + "id": 11, + "seek": 6000, + "start": 70.4, + "end": 72.52, + "text": " So I guess I'm working on my position but it's not", + "tokens": [ + 50864, + 407, + 286, + 2041, + 286, + 478, + 1364, + 322, + 452, + 2535, + 457, + 309, + 311, + 406, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.458, + "words": [ + { + "text": "So", + "start": 70.4, + "end": 70.42, + "confidence": 0.914 + }, + { + "text": "I", + "start": 70.42, + "end": 70.54, + "confidence": 0.727 + }, 
+ { + "text": "guess", + "start": 70.54, + "end": 70.8, + "confidence": 0.767 + }, + { + "text": "I'm", + "start": 70.8, + "end": 71.3, + "confidence": 0.363 + }, + { + "text": "working", + "start": 71.3, + "end": 71.32, + "confidence": 0.653 + }, + { + "text": "on", + "start": 71.32, + "end": 71.58, + "confidence": 0.396 + }, + { + "text": "my", + "start": 71.58, + "end": 71.74, + "confidence": 0.261 + }, + { + "text": "position", + "start": 71.74, + "end": 71.98, + "confidence": 0.081 + }, + { + "text": "but", + "start": 71.98, + "end": 72.18, + "confidence": 0.291 + }, + { + "text": "it's", + "start": 72.18, + "end": 72.38, + "confidence": 0.792 + }, + { + "text": "not", + "start": 72.38, + "end": 72.52, + "confidence": 0.585 + } + ] + }, + { + "id": 12, + "seek": 6000, + "start": 74.72, + "end": 75.22, + "text": " Oh my god", + "tokens": [ + 51014, + 876, + 452, + 3044, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.199, + "words": [ + { + "text": "Oh", + "start": 74.72, + "end": 74.74, + "confidence": 0.145 + }, + { + "text": "my", + "start": 74.74, + "end": 75.08, + "confidence": 0.273 + }, + { + "text": "god", + "start": 75.08, + "end": 75.22, + "confidence": 0.2 + } + ] + }, + { + "id": 13, + "seek": 6000, + "start": 75.22, + "end": 76.64, + "text": " Okay, no problem", + "tokens": [ + 51114, + 1033, + 11, + 572, + 1154, + 51214 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.623, + "words": [ + { + "text": "Okay,", + "start": 75.22, + "end": 75.9, + "confidence": 0.682 + }, + { + "text": "no", + "start": 76.26, + "end": 76.32, + "confidence": 0.365 + }, + { + "text": "problem", + "start": 76.32, + "end": 76.64, + "confidence": 0.97 + } + ] + }, + { + "id": 14, + "seek": 6000, + "start": 76.64, + "end": 77.5, + 
"text": " No idea", + "tokens": [ + 51214, + 883, + 1558, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.223, + "words": [ + { + "text": "No", + "start": 76.64, + "end": 77.28, + "confidence": 0.223 + }, + { + "text": "idea", + "start": 77.28, + "end": 77.5, + "confidence": 0.224 + } + ] + }, + { + "id": 15, + "seek": 6000, + "start": 78.06, + "end": 78.6, + "text": " No idea", + "tokens": [ + 51264, + 883, + 1558, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.282, + "words": [ + { + "text": "No", + "start": 78.06, + "end": 78.38, + "confidence": 0.105 + }, + { + "text": "idea", + "start": 78.38, + "end": 78.6, + "confidence": 0.76 + } + ] + }, + { + "id": 16, + "seek": 6000, + "start": 85.28, + "end": 85.58, + "text": " Okay", + "tokens": [ + 51614, + 1033, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.101, + "words": [ + { + "text": "Okay", + "start": 85.28, + "end": 85.58, + "confidence": 0.101 + } + ] + }, + { + "id": 17, + "seek": 6000, + "start": 86.6, + "end": 86.86, + "text": " Okay", + "tokens": [ + 51664, + 1033, + 51714 + ], + "temperature": 0.0, + "avg_logprob": -0.9387273416890727, + "compression_ratio": 1.4172185430463575, + "no_speech_prob": 0.10345567017793655, + "confidence": 0.159, + "words": [ + { + "text": "Okay", + "start": 86.6, + "end": 86.86, + "confidence": 0.159 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.90898597240448, + "zh": 0.0063686794601380825, + "de": 0.0015729529550299048, + "es": 0.0061727361753582954, + "ru": 0.0024746020790189505, + "ko": 0.004695970099419355, + "fr": 0.0016613693442195654, + "ja": 0.003055725945159793, + 
"pt": 0.002100167563185096, + "tr": 0.0005608535720966756, + "pl": 0.00023197913833428174, + "ca": 5.729480835725553e-05, + "nl": 0.0019272222416475415, + "ar": 0.0010980981169268489, + "sv": 0.0010980981169268489, + "it": 0.0002393429313087836, + "id": 0.0011873272014781833, + "hi": 0.00014977698447182775, + "fi": 0.0010076714679598808, + "vi": 0.005533204879611731, + "he": 0.00017239226144738495, + "uk": 0.0002932491188403219, + "el": 0.0003401749418117106, + "ms": 0.0010076714679598808, + "cs": 4.4621239794651046e-05, + "ro": 0.0002079447585856542, + "da": 0.0010980981169268489, + "hu": 0.0001657880056882277, + "ta": 0.00026492850156500936, + "no": 8.873992919689044e-05, + "th": 0.0017685183556750417, + "ur": 0.0001606872392585501, + "hr": 3.6135381378699094e-05, + "bg": 3.8767600926803425e-05, + "lt": 1.964646617125254e-05, + "la": 0.002067607594653964, + "mi": 0.001782389241270721, + "ml": 0.001432189834304154, + "cy": 0.002436236944049597, + "sk": 8.650221388961654e-06, + "te": 9.084433986572549e-05, + "fa": 7.186378206824884e-05, + "lv": 2.4260149075416848e-05, + "bn": 8.01698406576179e-05, + "sr": 1.1869727131852414e-05, + "az": 8.416896889684722e-06, + "sl": 3.18893653457053e-05, + "kn": 5.105106083647115e-06, + "et": 1.059847363649169e-05, + "mk": 5.2466243687376846e-06, + "br": 0.0005696857697330415, + "eu": 1.7203019524458796e-05, + "is": 3.7282443372532725e-05, + "hy": 1.7203019524458796e-05, + "ne": 4.567940050037578e-05, + "mn": 0.00018640047346707433, + "bs": 2.7923257221118547e-05, + "kk": 4.5405749915516935e-06, + "sq": 2.5030247343238443e-05, + "sw": 9.670329018263146e-05, + "gl": 0.00016971956938505173, + "mr": 1.874678855529055e-05, + "pa": 6.182035122037632e-06, + "si": 0.00013425922952592373, + "km": 0.0008033857448026538, + "sn": 0.00027548204525373876, + "yo": 0.00018494989490136504, + "so": 4.215781245875405e-06, + "af": 8.01698406576179e-05, + "oc": 3.18893653457053e-05, + "ka": 8.221919415518641e-06, + "be": 1.7203019524458796e-05, + 
"tg": 1.2656181525017018e-07, + "sd": 3.0908227927284315e-05, + "gu": 3.4950057852256577e-06, + "am": 1.1685703611874487e-05, + "yi": 0.00014977698447182775, + "lo": 2.8809638024540618e-05, + "uz": 1.9721213551093797e-09, + "fo": 0.00045419312664307654, + "ht": 0.00015574341523461044, + "ps": 9.316655450675171e-06, + "tk": 1.7671988317147225e-08, + "nn": 0.015158776193857193, + "mt": 1.2439366400940344e-05, + "sa": 9.446316107641906e-05, + "lb": 1.3684594080132229e-07, + "my": 0.00024311205197591335, + "bo": 0.00028422678587958217, + "tl": 0.0014776524621993303, + "mg": 3.611920007529079e-08, + "as": 1.2635258826776408e-05, + "tt": 1.3765013306965557e-07, + "haw": 0.010665531270205975, + "ln": 9.956344001693651e-06, + "ha": 1.6636236921385716e-07, + "ba": 1.7880301683703692e-08, + "jw": 0.004480925854295492, + "su": 1.108212259737229e-07 + } +} \ No newline at end of file diff --git a/tests/expected/corner_cases/arabic.mp3.words.json b/tests/expected/corner_cases/arabic.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..f88ce5e8e84ed6fbfd0acd935f21544d17bd4c95 --- /dev/null +++ b/tests/expected/corner_cases/arabic.mp3.words.json @@ -0,0 +1,393 @@ +{ + "text": " حبّي أنصار الهدى حبّي ركب الفدا وطلّبي سأر الشاهد وطلّبي سأر الشاهد لمتى سنضل رقودا نغرق في النوم ونشخر وعن الآذان نسمّه ونغمّض كي لا نمسر", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 1.8, + "end": 7.48, + "text": " حبّي أنصار الهدى", + "tokens": [ + 50364, + 11331, + 3555, + 11703, + 1829, + 14739, + 9381, + 9640, + 2423, + 3224, + 3215, + 7578, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.5114130362486228, + "compression_ratio": 1.1842105263157894, + "no_speech_prob": 0.7993651032447815, + "confidence": 0.651, + "words": [ + { + "text": "حبّي", + "start": 1.8, + "end": 4.26, + "confidence": 0.436 + }, + { + "text": "أنصار", + "start": 4.26, + "end": 5.7, + "confidence": 0.795 + }, + { + "text": "الهدى", + "start": 5.7, + "end": 7.48, + "confidence": 
0.837 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 9.24, + "end": 15.2, + "text": " حبّي ركب الفدا", + "tokens": [ + 50714, + 11331, + 3555, + 11703, + 1829, + 12602, + 4117, + 3555, + 27188, + 28259, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.5114130362486228, + "compression_ratio": 1.1842105263157894, + "no_speech_prob": 0.7993651032447815, + "confidence": 0.829, + "words": [ + { + "text": "حبّي", + "start": 9.24, + "end": 12.58, + "confidence": 0.875 + }, + { + "text": "ركب", + "start": 12.58, + "end": 13.76, + "confidence": 0.853 + }, + { + "text": "الفدا", + "start": 13.76, + "end": 15.2, + "confidence": 0.711 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 18.86, + "end": 23.42, + "text": " وطلّبي سأر الشاهد", + "tokens": [ + 51114, + 4032, + 9566, + 1211, + 11703, + 21292, + 8608, + 10721, + 2288, + 25124, + 40294, + 3215, + 51514 + ], + "temperature": 0.0, + "avg_logprob": -0.5114130362486228, + "compression_ratio": 1.1842105263157894, + "no_speech_prob": 0.7993651032447815, + "confidence": 0.587, + "words": [ + { + "text": "وطلّبي", + "start": 18.86, + "end": 20.68, + "confidence": 0.54 + }, + { + "text": "سأر", + "start": 20.68, + "end": 21.78, + "confidence": 0.94 + }, + { + "text": "الشاهد", + "start": 21.78, + "end": 23.42, + "confidence": 0.421 + } + ] + }, + { + "id": 3, + "seek": 2300, + "start": 24.2, + "end": 28.96, + "text": " وطلّبي سأر الشاهد", + "tokens": [ + 50414, + 4032, + 9566, + 1211, + 11703, + 21292, + 8608, + 10721, + 2288, + 25124, + 40294, + 3215, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.24054829042349288, + "compression_ratio": 1.3675213675213675, + "no_speech_prob": 0.008175775408744812, + "confidence": 0.875, + "words": [ + { + "text": "وطلّبي", + "start": 24.2, + "end": 25.98, + "confidence": 0.799 + }, + { + "text": "سأر", + "start": 25.98, + "end": 27.12, + "confidence": 0.95 + }, + { + "text": "الشاهد", + "start": 27.12, + "end": 28.96, + "confidence": 0.936 + } + ] + }, + { + "id": 4, + 
"seek": 2300, + "start": 30.88, + "end": 33.34, + "text": " لمتى سنضل رقودا", + "tokens": [ + 50714, + 32767, + 49975, + 8608, + 1863, + 11242, + 1211, + 12602, + 4587, + 23328, + 995, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.24054829042349288, + "compression_ratio": 1.3675213675213675, + "no_speech_prob": 0.008175775408744812, + "confidence": 0.714, + "words": [ + { + "text": "لمتى", + "start": 30.88, + "end": 31.48, + "confidence": 0.692 + }, + { + "text": "سنضل", + "start": 31.48, + "end": 32.34, + "confidence": 0.754 + }, + { + "text": "رقودا", + "start": 32.34, + "end": 33.34, + "confidence": 0.686 + } + ] + }, + { + "id": 5, + "seek": 2300, + "start": 33.36, + "end": 35.88, + "text": " نغرق في النوم ونشخر", + "tokens": [ + 50864, + 8717, + 17082, + 2288, + 4587, + 8978, + 28239, + 20498, + 4032, + 1863, + 8592, + 34740, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.24054829042349288, + "compression_ratio": 1.3675213675213675, + "no_speech_prob": 0.008175775408744812, + "confidence": 0.926, + "words": [ + { + "text": "نغرق", + "start": 33.36, + "end": 34.22, + "confidence": 0.901 + }, + { + "text": "في", + "start": 34.22, + "end": 34.44, + "confidence": 0.873 + }, + { + "text": "النوم", + "start": 34.44, + "end": 35.04, + "confidence": 0.974 + }, + { + "text": "ونشخر", + "start": 35.04, + "end": 35.88, + "confidence": 0.942 + } + ] + }, + { + "id": 6, + "seek": 2300, + "start": 36.24, + "end": 38.72, + "text": " وعن الآذان نسمّه", + "tokens": [ + 51014, + 4032, + 3615, + 1863, + 6024, + 95, + 8848, + 7649, + 8717, + 38251, + 11703, + 3224, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.24054829042349288, + "compression_ratio": 1.3675213675213675, + "no_speech_prob": 0.008175775408744812, + "confidence": 0.765, + "words": [ + { + "text": "وعن", + "start": 36.24, + "end": 36.76, + "confidence": 0.923 + }, + { + "text": "الآذان", + "start": 36.76, + "end": 37.72, + "confidence": 0.82 + }, + { + "text": "نسمّه", + "start": 37.72, + 
"end": 38.72, + "confidence": 0.619 + } + ] + }, + { + "id": 7, + "seek": 2300, + "start": 38.88, + "end": 41.3, + "text": " ونغمّض كي لا نمسر", + "tokens": [ + 51164, + 4032, + 1863, + 17082, + 2304, + 11703, + 11242, + 9122, + 1829, + 20193, + 8717, + 2304, + 3794, + 2288, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.24054829042349288, + "compression_ratio": 1.3675213675213675, + "no_speech_prob": 0.008175775408744812, + "confidence": 0.79, + "words": [ + { + "text": "ونغمّض", + "start": 38.88, + "end": 39.9, + "confidence": 0.91 + }, + { + "text": "كي", + "start": 39.9, + "end": 40.28, + "confidence": 0.833 + }, + { + "text": "لا", + "start": 40.28, + "end": 40.56, + "confidence": 0.804 + }, + { + "text": "نمسر", + "start": 40.56, + "end": 41.3, + "confidence": 0.619 + } + ] + } + ], + "language": "Arabic" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/issue24_empty.wav.words.json b/tests/expected/corner_cases/issue24_empty.wav.words.json new file mode 100644 index 0000000000000000000000000000000000000000..2fb877fdb2d3636b652056874c7de84a30c4567f --- /dev/null +++ b/tests/expected/corner_cases/issue24_empty.wav.words.json @@ -0,0 +1,992 @@ +{ + "text": " I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. I'm sorry. 
I'm sorry.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.0, + "end": 0.96, + "text": " I'm sorry.", + "tokens": [ + 50363, + 314, + 1101, + 7926, + 13, + 50413 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.102, + "words": [ + { + "text": "I'm", + "start": 0.0, + "end": 0.94, + "confidence": 0.105 + }, + { + "text": "sorry", + "start": 0.94, + "end": 0.96, + "confidence": 0.096 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 0.96, + "end": 2.38, + "text": " I'm sorry.", + "tokens": [ + 50413, + 314, + 1101, + 7926, + 13, + 50463 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.405, + "words": [ + { + "text": "I'm", + "start": 0.96, + "end": 2.26, + "confidence": 0.353 + }, + { + "text": "sorry", + "start": 2.26, + "end": 2.38, + "confidence": 0.533 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 2.38, + "end": 2.42, + "text": " I'm sorry.", + "tokens": [ + 50463, + 314, + 1101, + 7926, + 13, + 50513 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.611, + "words": [ + { + "text": "I'm", + "start": 2.38, + "end": 2.4, + "confidence": 0.551 + }, + { + "text": "sorry", + "start": 2.4, + "end": 2.42, + "confidence": 0.752 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 3.0, + "end": 3.24, + "text": " I'm sorry.", + "tokens": [ + 50513, + 314, + 1101, + 7926, + 13, + 50563 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.765, + "words": [ + { + "text": "I'm", + "start": 3.0, + "end": 3.22, + "confidence": 0.714 + }, + { + "text": "sorry", + "start": 3.22, + "end": 3.24, + "confidence": 0.877 + } + ] + }, + { + "id": 4, + "seek": 0, 
+ "start": 4.36, + "end": 4.48, + "text": " I'm sorry.", + "tokens": [ + 50563, + 314, + 1101, + 7926, + 13, + 50613 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.849, + "words": [ + { + "text": "I'm", + "start": 4.36, + "end": 4.42, + "confidence": 0.804 + }, + { + "text": "sorry", + "start": 4.42, + "end": 4.48, + "confidence": 0.947 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 5.5, + "end": 5.78, + "text": " I'm sorry.", + "tokens": [ + 50613, + 314, + 1101, + 7926, + 13, + 50663 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.89, + "words": [ + { + "text": "I'm", + "start": 5.5, + "end": 5.54, + "confidence": 0.852 + }, + { + "text": "sorry", + "start": 5.54, + "end": 5.78, + "confidence": 0.972 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 5.92, + "end": 6.8, + "text": " I'm sorry.", + "tokens": [ + 50663, + 314, + 1101, + 7926, + 13, + 50713 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.918, + "words": [ + { + "text": "I'm", + "start": 5.92, + "end": 6.14, + "confidence": 0.887 + }, + { + "text": "sorry", + "start": 6.14, + "end": 6.8, + "confidence": 0.983 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 7.5, + "end": 8.5, + "text": " I'm sorry.", + "tokens": [ + 50713, + 314, + 1101, + 7926, + 13, + 50763 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.941, + "words": [ + { + "text": "I'm", + "start": 7.5, + "end": 8.48, + "confidence": 0.919 + }, + { + "text": "sorry", + "start": 8.48, + "end": 8.5, + "confidence": 0.988 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 8.56, + "end": 9.48, + "text": " I'm sorry.", + 
"tokens": [ + 50763, + 314, + 1101, + 7926, + 13, + 50813 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.95, + "words": [ + { + "text": "I'm", + "start": 8.56, + "end": 9.0, + "confidence": 0.93 + }, + { + "text": "sorry", + "start": 9.0, + "end": 9.48, + "confidence": 0.991 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 9.54, + "end": 10.38, + "text": " I'm sorry.", + "tokens": [ + 50813, + 314, + 1101, + 7926, + 13, + 50863 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.963, + "words": [ + { + "text": "I'm", + "start": 9.54, + "end": 9.56, + "confidence": 0.948 + }, + { + "text": "sorry", + "start": 9.56, + "end": 10.38, + "confidence": 0.993 + } + ] + }, + { + "id": 10, + "seek": 0, + "start": 10.38, + "end": 11.36, + "text": " I'm sorry.", + "tokens": [ + 50863, + 314, + 1101, + 7926, + 13, + 50913 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.968, + "words": [ + { + "text": "I'm", + "start": 10.38, + "end": 11.34, + "confidence": 0.955 + }, + { + "text": "sorry", + "start": 11.34, + "end": 11.36, + "confidence": 0.994 + } + ] + }, + { + "id": 11, + "seek": 0, + "start": 11.36, + "end": 12.48, + "text": " I'm sorry.", + "tokens": [ + 50913, + 314, + 1101, + 7926, + 13, + 50963 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.978, + "words": [ + { + "text": "I'm", + "start": 11.36, + "end": 12.06, + "confidence": 0.969 + }, + { + "text": "sorry", + "start": 12.06, + "end": 12.48, + "confidence": 0.996 + } + ] + }, + { + "id": 12, + "seek": 0, + "start": 12.54, + "end": 12.93, + "text": " I'm sorry.", + "tokens": [ + 50963, + 314, + 1101, 
+ 7926, + 13, + 51013 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.98, + "words": [ + { + "text": "I'm", + "start": 12.54, + "end": 12.56, + "confidence": 0.972 + }, + { + "text": "sorry", + "start": 12.56, + "end": 12.93, + "confidence": 0.996 + } + ] + }, + { + "id": 13, + "seek": 0, + "start": 12.93, + "end": 14.5, + "text": " I'm sorry.", + "tokens": [ + 51013, + 314, + 1101, + 7926, + 13, + 51063 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.979, + "words": [ + { + "text": "I'm", + "start": 12.93, + "end": 14.48, + "confidence": 0.971 + }, + { + "text": "sorry", + "start": 14.48, + "end": 14.5, + "confidence": 0.996 + } + ] + }, + { + "id": 14, + "seek": 0, + "start": 14.5, + "end": 15.46, + "text": " I'm sorry.", + "tokens": [ + 51063, + 314, + 1101, + 7926, + 13, + 51113 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.982, + "words": [ + { + "text": "I'm", + "start": 14.5, + "end": 15.42, + "confidence": 0.974 + }, + { + "text": "sorry", + "start": 15.42, + "end": 15.46, + "confidence": 0.996 + } + ] + }, + { + "id": 15, + "seek": 0, + "start": 15.46, + "end": 16.48, + "text": " I'm sorry.", + "tokens": [ + 51113, + 314, + 1101, + 7926, + 13, + 51163 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.983, + "words": [ + { + "text": "I'm", + "start": 15.46, + "end": 16.4, + "confidence": 0.976 + }, + { + "text": "sorry", + "start": 16.4, + "end": 16.48, + "confidence": 0.997 + } + ] + }, + { + "id": 16, + "seek": 0, + "start": 16.48, + "end": 17.5, + "text": " I'm sorry.", + "tokens": [ + 51163, + 314, + 1101, + 7926, + 13, + 51213 + ], + 
"temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.982, + "words": [ + { + "text": "I'm", + "start": 16.48, + "end": 17.48, + "confidence": 0.975 + }, + { + "text": "sorry", + "start": 17.48, + "end": 17.5, + "confidence": 0.997 + } + ] + }, + { + "id": 17, + "seek": 0, + "start": 17.54, + "end": 18.5, + "text": " I'm sorry.", + "tokens": [ + 51213, + 314, + 1101, + 7926, + 13, + 51263 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.984, + "words": [ + { + "text": "I'm", + "start": 17.54, + "end": 18.48, + "confidence": 0.978 + }, + { + "text": "sorry", + "start": 18.48, + "end": 18.5, + "confidence": 0.997 + } + ] + }, + { + "id": 18, + "seek": 0, + "start": 18.5, + "end": 19.48, + "text": " I'm sorry.", + "tokens": [ + 51263, + 314, + 1101, + 7926, + 13, + 51313 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.984, + "words": [ + { + "text": "I'm", + "start": 18.5, + "end": 19.34, + "confidence": 0.978 + }, + { + "text": "sorry", + "start": 19.34, + "end": 19.48, + "confidence": 0.997 + } + ] + }, + { + "id": 19, + "seek": 0, + "start": 19.64, + "end": 20.32, + "text": " I'm sorry.", + "tokens": [ + 51313, + 314, + 1101, + 7926, + 13, + 51363 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.986, + "words": [ + { + "text": "I'm", + "start": 19.64, + "end": 19.68, + "confidence": 0.98 + }, + { + "text": "sorry", + "start": 19.68, + "end": 20.32, + "confidence": 0.997 + } + ] + }, + { + "id": 20, + "seek": 0, + "start": 20.32, + "end": 20.36, + "text": " I'm sorry.", + "tokens": [ + 51363, + 314, + 1101, + 7926, + 13, + 51413 + ], + "temperature": 0.0, + 
"avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.986, + "words": [ + { + "text": "I'm", + "start": 20.32, + "end": 20.34, + "confidence": 0.98 + }, + { + "text": "sorry", + "start": 20.34, + "end": 20.36, + "confidence": 0.997 + } + ] + }, + { + "id": 21, + "seek": 0, + "start": 21.58, + "end": 22.5, + "text": " I'm sorry.", + "tokens": [ + 51413, + 314, + 1101, + 7926, + 13, + 51463 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.987, + "words": [ + { + "text": "I'm", + "start": 21.58, + "end": 22.48, + "confidence": 0.983 + }, + { + "text": "sorry", + "start": 22.48, + "end": 22.5, + "confidence": 0.997 + } + ] + }, + { + "id": 22, + "seek": 0, + "start": 22.58, + "end": 23.46, + "text": " I'm sorry.", + "tokens": [ + 51463, + 314, + 1101, + 7926, + 13, + 51513 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.987, + "words": [ + { + "text": "I'm", + "start": 22.58, + "end": 22.6, + "confidence": 0.982 + }, + { + "text": "sorry", + "start": 22.6, + "end": 23.46, + "confidence": 0.997 + } + ] + }, + { + "id": 23, + "seek": 0, + "start": 23.46, + "end": 23.7, + "text": " I'm sorry.", + "tokens": [ + 51513, + 314, + 1101, + 7926, + 13, + 51563 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.988, + "words": [ + { + "text": "I'm", + "start": 23.46, + "end": 23.48, + "confidence": 0.984 + }, + { + "text": "sorry", + "start": 23.48, + "end": 23.7, + "confidence": 0.997 + } + ] + }, + { + "id": 24, + "seek": 0, + "start": 24.5, + "end": 24.54, + "text": " I'm sorry.", + "tokens": [ + 51563, + 314, + 1101, + 7926, + 13, + 51613 + ], + "temperature": 0.0, + "avg_logprob": 
-0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.988, + "words": [ + { + "text": "I'm", + "start": 24.5, + "end": 24.52, + "confidence": 0.984 + }, + { + "text": "sorry", + "start": 24.52, + "end": 24.54, + "confidence": 0.998 + } + ] + }, + { + "id": 25, + "seek": 0, + "start": 24.54, + "end": 26.48, + "text": " I'm sorry.", + "tokens": [ + 51613, + 314, + 1101, + 7926, + 13, + 51663 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.985, + "words": [ + { + "text": "I'm", + "start": 24.54, + "end": 26.26, + "confidence": 0.979 + }, + { + "text": "sorry", + "start": 26.26, + "end": 26.48, + "confidence": 0.998 + } + ] + }, + { + "id": 26, + "seek": 0, + "start": 26.48, + "end": 27.5, + "text": " I'm sorry.", + "tokens": [ + 51663, + 314, + 1101, + 7926, + 13, + 51713 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.982, + "words": [ + { + "text": "I'm", + "start": 26.48, + "end": 27.48, + "confidence": 0.974 + }, + { + "text": "sorry", + "start": 27.48, + "end": 27.5, + "confidence": 0.998 + } + ] + }, + { + "id": 27, + "seek": 0, + "start": 27.5, + "end": 28.46, + "text": " I'm sorry.", + "tokens": [ + 51713, + 314, + 1101, + 7926, + 13, + 51763 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + "compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.975, + "words": [ + { + "text": "I'm", + "start": 27.5, + "end": 28.44, + "confidence": 0.964 + }, + { + "text": "sorry", + "start": 28.44, + "end": 28.46, + "confidence": 0.998 + } + ] + }, + { + "id": 28, + "seek": 0, + "start": 28.46, + "end": 29.32, + "text": " I'm sorry.", + "tokens": [ + 51763, + 314, + 1101, + 7926, + 13, + 51813 + ], + "temperature": 0.0, + "avg_logprob": -0.12369282679124312, + 
"compression_ratio": 13.25, + "no_speech_prob": 0.7658452391624451, + "confidence": 0.954, + "words": [ + { + "text": "I'm", + "start": 28.46, + "end": 29.3, + "confidence": 0.933 + }, + { + "text": "sorry", + "start": 29.3, + "end": 29.32, + "confidence": 0.998 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/large-v2.accurate_gloria.mp3.words.json b/tests/expected/corner_cases/large-v2.accurate_gloria.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..841b9608aec18ab79018280551a269d44efac00d --- /dev/null +++ b/tests/expected/corner_cases/large-v2.accurate_gloria.mp3.words.json @@ -0,0 +1,540 @@ +{ + "text": " Ella, my glorious love, how are you? Oh, I'm okay. I will be. I said she could stay with us tomorrow just until she feels better. Of course she can. No, this won't be for long. Well, if you can stay as long as you want, my love. I've really missed you. Pops.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.0, + "end": 6.28, + "text": " Ella, my glorious love, how are you?", + "tokens": [ + 50364, + 29261, + 11, + 452, + 24026, + 959, + 11, + 577, + 366, + 291, + 30, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.452, + "words": [ + { + "text": "Ella,", + "start": 0.0, + "end": 1.68, + "confidence": 0.126 + }, + { + "text": "my", + "start": 1.94, + "end": 2.7, + "confidence": 0.368 + }, + { + "text": "glorious", + "start": 2.7, + "end": 3.5, + "confidence": 0.729 + }, + { + "text": "love,", + "start": 3.5, + "end": 4.18, + "confidence": 0.432 + }, + { + "text": "how", + "start": 4.94, + "end": 5.66, + "confidence": 0.693 + }, + { + "text": "are", + "start": 5.66, + "end": 6.02, + "confidence": 0.902 + }, + { + "text": "you?", + "start": 6.02, + "end": 6.28, + "confidence": 0.845 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 
6.28, + "end": 9.18, + "text": " Oh, I'm okay. I will be.", + "tokens": [ + 50664, + 876, + 11, + 286, + 478, + 1392, + 13, + 286, + 486, + 312, + 13, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.68, + "words": [ + { + "text": "Oh,", + "start": 6.28, + "end": 6.6, + "confidence": 0.427 + }, + { + "text": "I'm", + "start": 6.68, + "end": 7.02, + "confidence": 0.958 + }, + { + "text": "okay.", + "start": 7.02, + "end": 7.64, + "confidence": 0.605 + }, + { + "text": "I", + "start": 8.3, + "end": 8.58, + "confidence": 0.562 + }, + { + "text": "will", + "start": 8.58, + "end": 8.86, + "confidence": 0.813 + }, + { + "text": "be.", + "start": 8.86, + "end": 9.18, + "confidence": 0.871 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 9.18, + "end": 11.48, + "text": " I said she could stay with us tomorrow just until she feels better.", + "tokens": [ + 50814, + 286, + 848, + 750, + 727, + 1754, + 365, + 505, + 4153, + 445, + 1826, + 750, + 3417, + 1101, + 13, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.571, + "words": [ + { + "text": "I", + "start": 9.18, + "end": 9.44, + "confidence": 0.66 + }, + { + "text": "said", + "start": 9.44, + "end": 9.62, + "confidence": 0.869 + }, + { + "text": "she", + "start": 9.62, + "end": 9.76, + "confidence": 0.748 + }, + { + "text": "could", + "start": 9.76, + "end": 9.88, + "confidence": 0.813 + }, + { + "text": "stay", + "start": 9.88, + "end": 10.08, + "confidence": 0.925 + }, + { + "text": "with", + "start": 10.08, + "end": 10.22, + "confidence": 0.808 + }, + { + "text": "us", + "start": 10.22, + "end": 10.34, + "confidence": 0.628 + }, + { + "text": "tomorrow", + "start": 10.34, + "end": 10.56, + "confidence": 0.219 + }, + { + "text": "just", + "start": 10.56, + "end": 10.74, + 
"confidence": 0.067 + }, + { + "text": "until", + "start": 10.74, + "end": 10.86, + "confidence": 0.4 + }, + { + "text": "she", + "start": 10.86, + "end": 10.98, + "confidence": 0.803 + }, + { + "text": "feels", + "start": 10.98, + "end": 11.18, + "confidence": 0.788 + }, + { + "text": "better.", + "start": 11.18, + "end": 11.48, + "confidence": 0.807 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 11.5, + "end": 13.34, + "text": " Of course she can.", + "tokens": [ + 50964, + 2720, + 1164, + 750, + 393, + 13, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.333, + "words": [ + { + "text": "Of", + "start": 11.5, + "end": 12.1, + "confidence": 0.123 + }, + { + "text": "course", + "start": 12.1, + "end": 12.6, + "confidence": 0.86 + }, + { + "text": "she", + "start": 12.6, + "end": 12.88, + "confidence": 0.085 + }, + { + "text": "can.", + "start": 12.88, + "end": 13.34, + "confidence": 0.674 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.34, + "end": 15.2, + "text": " No, this won't be for long.", + "tokens": [ + 51014, + 883, + 11, + 341, + 1582, + 380, + 312, + 337, + 938, + 13, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.649, + "words": [ + { + "text": "No,", + "start": 13.34, + "end": 13.78, + "confidence": 0.328 + }, + { + "text": "this", + "start": 13.9, + "end": 14.24, + "confidence": 0.419 + }, + { + "text": "won't", + "start": 14.24, + "end": 14.54, + "confidence": 0.917 + }, + { + "text": "be", + "start": 14.54, + "end": 14.68, + "confidence": 0.906 + }, + { + "text": "for", + "start": 14.68, + "end": 14.88, + "confidence": 0.884 + }, + { + "text": "long.", + "start": 14.88, + "end": 15.2, + "confidence": 0.823 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 15.2, + "end": 17.44, + "text": " 
Well, if you can stay as long as you want, my love.", + "tokens": [ + 51114, + 1042, + 11, + 498, + 291, + 393, + 1754, + 382, + 938, + 382, + 291, + 528, + 11, + 452, + 959, + 13, + 51214 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.69, + "words": [ + { + "text": "Well,", + "start": 15.2, + "end": 15.46, + "confidence": 0.553 + }, + { + "text": "if", + "start": 15.52, + "end": 15.6, + "confidence": 0.084 + }, + { + "text": "you", + "start": 15.6, + "end": 15.68, + "confidence": 0.898 + }, + { + "text": "can", + "start": 15.68, + "end": 15.8, + "confidence": 0.827 + }, + { + "text": "stay", + "start": 15.8, + "end": 16.04, + "confidence": 0.922 + }, + { + "text": "as", + "start": 16.04, + "end": 16.18, + "confidence": 0.896 + }, + { + "text": "long", + "start": 16.18, + "end": 16.32, + "confidence": 0.893 + }, + { + "text": "as", + "start": 16.32, + "end": 16.46, + "confidence": 0.902 + }, + { + "text": "you", + "start": 16.46, + "end": 16.58, + "confidence": 0.905 + }, + { + "text": "want,", + "start": 16.58, + "end": 16.76, + "confidence": 0.731 + }, + { + "text": "my", + "start": 16.88, + "end": 17.02, + "confidence": 0.901 + }, + { + "text": "love.", + "start": 17.02, + "end": 17.44, + "confidence": 0.831 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 17.44, + "end": 18.96, + "text": " I've really missed you.", + "tokens": [ + 51214, + 286, + 600, + 534, + 6721, + 291, + 13, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.529, + "words": [ + { + "text": "I've", + "start": 17.44, + "end": 17.58, + "confidence": 0.309 + }, + { + "text": "really", + "start": 17.58, + "end": 18.18, + "confidence": 0.763 + }, + { + "text": "missed", + "start": 18.18, + "end": 18.68, + "confidence": 0.778 + }, + { + "text": "you.", + 
"start": 18.68, + "end": 18.96, + "confidence": 0.622 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 19.58, + "end": 20.12, + "text": " Pops.", + "tokens": [ + 51314, + 430, + 3370, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.3579153639546941, + "compression_ratio": 1.425414364640884, + "no_speech_prob": 0.24429768323898315, + "confidence": 0.02, + "words": [ + { + "text": "Pops.", + "start": 19.58, + "end": 20.12, + "confidence": 0.02 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/large-v2.efficient_gloria.mp3.words.json b/tests/expected/corner_cases/large-v2.efficient_gloria.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..01b1c82f79a532c844d5b50fb036a4d1ce190ef2 --- /dev/null +++ b/tests/expected/corner_cases/large-v2.efficient_gloria.mp3.words.json @@ -0,0 +1,564 @@ +{ + "text": " Ella, my glorious love. How are you? Oh, I'm okay. I will be. I said she could stay with us tomorrow, just until she feels better. Of course she can. No, this won't be for long. Well, if you can stay as long as you want, my love. I really missed you. 
I agree.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.0, + "end": 4.02, + "text": " Ella, my glorious love.", + "tokens": [ + 50364, + 29261, + 11, + 452, + 24026, + 959, + 13, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.477, + "words": [ + { + "text": "Ella,", + "start": 0.0, + "end": 1.68, + "confidence": 0.128 + }, + { + "text": "my", + "start": 1.92, + "end": 2.1, + "confidence": 0.733 + }, + { + "text": "glorious", + "start": 2.1, + "end": 3.36, + "confidence": 0.625 + }, + { + "text": "love.", + "start": 3.36, + "end": 4.02, + "confidence": 0.883 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 5.46, + "end": 6.24, + "text": " How are you?", + "tokens": [ + 50564, + 1012, + 366, + 291, + 30, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.682, + "words": [ + { + "text": "How", + "start": 5.46, + "end": 5.62, + "confidence": 0.454 + }, + { + "text": "are", + "start": 5.62, + "end": 6.02, + "confidence": 0.893 + }, + { + "text": "you?", + "start": 6.02, + "end": 6.24, + "confidence": 0.783 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 6.32, + "end": 9.12, + "text": " Oh, I'm okay. 
I will be.", + "tokens": [ + 50664, + 876, + 11, + 286, + 478, + 1392, + 13, + 286, + 486, + 312, + 13, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.73, + "words": [ + { + "text": "Oh,", + "start": 6.32, + "end": 6.66, + "confidence": 0.479 + }, + { + "text": "I'm", + "start": 6.74, + "end": 7.02, + "confidence": 0.971 + }, + { + "text": "okay.", + "start": 7.02, + "end": 7.7, + "confidence": 0.476 + }, + { + "text": "I", + "start": 8.14, + "end": 8.56, + "confidence": 0.714 + }, + { + "text": "will", + "start": 8.56, + "end": 8.82, + "confidence": 0.795 + }, + { + "text": "be.", + "start": 8.82, + "end": 9.12, + "confidence": 0.906 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 9.32, + "end": 11.42, + "text": " I said she could stay with us tomorrow, just until she feels better.", + "tokens": [ + 50814, + 286, + 848, + 750, + 727, + 1754, + 365, + 505, + 4153, + 11, + 445, + 1826, + 750, + 3417, + 1101, + 13, + 50914 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.723, + "words": [ + { + "text": "I", + "start": 9.32, + "end": 9.48, + "confidence": 0.878 + }, + { + "text": "said", + "start": 9.48, + "end": 9.62, + "confidence": 0.862 + }, + { + "text": "she", + "start": 9.62, + "end": 9.76, + "confidence": 0.762 + }, + { + "text": "could", + "start": 9.76, + "end": 9.88, + "confidence": 0.801 + }, + { + "text": "stay", + "start": 9.88, + "end": 10.08, + "confidence": 0.921 + }, + { + "text": "with", + "start": 10.08, + "end": 10.22, + "confidence": 0.812 + }, + { + "text": "us", + "start": 10.22, + "end": 10.36, + "confidence": 0.848 + }, + { + "text": "tomorrow,", + "start": 10.36, + "end": 10.56, + "confidence": 0.515 + }, + { + "text": "just", + "start": 10.74, + "end": 10.76, + "confidence": 0.433 + }, + { + "text": 
"until", + "start": 10.76, + "end": 10.86, + "confidence": 0.439 + }, + { + "text": "she", + "start": 10.86, + "end": 10.98, + "confidence": 0.809 + }, + { + "text": "feels", + "start": 10.98, + "end": 11.16, + "confidence": 0.777 + }, + { + "text": "better.", + "start": 11.16, + "end": 11.42, + "confidence": 0.822 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 11.9, + "end": 13.06, + "text": " Of course she can.", + "tokens": [ + 50914, + 2720, + 1164, + 750, + 393, + 13, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.761, + "words": [ + { + "text": "Of", + "start": 11.9, + "end": 12.16, + "confidence": 0.562 + }, + { + "text": "course", + "start": 12.16, + "end": 12.54, + "confidence": 0.875 + }, + { + "text": "she", + "start": 12.54, + "end": 12.8, + "confidence": 0.758 + }, + { + "text": "can.", + "start": 12.8, + "end": 13.06, + "confidence": 0.899 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 13.7, + "end": 15.2, + "text": " No, this won't be for long.", + "tokens": [ + 51014, + 883, + 11, + 341, + 1582, + 380, + 312, + 337, + 938, + 13, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.774, + "words": [ + { + "text": "No,", + "start": 13.7, + "end": 13.72, + "confidence": 0.381 + }, + { + "text": "this", + "start": 13.92, + "end": 14.26, + "confidence": 0.702 + }, + { + "text": "won't", + "start": 14.26, + "end": 14.54, + "confidence": 0.943 + }, + { + "text": "be", + "start": 14.54, + "end": 14.68, + "confidence": 0.898 + }, + { + "text": "for", + "start": 14.68, + "end": 14.86, + "confidence": 0.891 + }, + { + "text": "long.", + "start": 14.86, + "end": 15.2, + "confidence": 0.877 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 15.3, + "end": 17.48, + "text": " Well, if you can stay as long as you 
want, my love.", + "tokens": [ + 51114, + 1042, + 11, + 498, + 291, + 393, + 1754, + 382, + 938, + 382, + 291, + 528, + 11, + 452, + 959, + 13, + 51214 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.836, + "words": [ + { + "text": "Well,", + "start": 15.3, + "end": 15.46, + "confidence": 0.647 + }, + { + "text": "if", + "start": 15.52, + "end": 15.6, + "confidence": 0.615 + }, + { + "text": "you", + "start": 15.6, + "end": 15.68, + "confidence": 0.896 + }, + { + "text": "can", + "start": 15.68, + "end": 15.82, + "confidence": 0.851 + }, + { + "text": "stay", + "start": 15.82, + "end": 16.04, + "confidence": 0.924 + }, + { + "text": "as", + "start": 16.04, + "end": 16.2, + "confidence": 0.885 + }, + { + "text": "long", + "start": 16.2, + "end": 16.32, + "confidence": 0.883 + }, + { + "text": "as", + "start": 16.32, + "end": 16.48, + "confidence": 0.907 + }, + { + "text": "you", + "start": 16.48, + "end": 16.58, + "confidence": 0.899 + }, + { + "text": "want,", + "start": 16.58, + "end": 16.76, + "confidence": 0.81 + }, + { + "text": "my", + "start": 16.9, + "end": 17.02, + "confidence": 0.901 + }, + { + "text": "love.", + "start": 17.02, + "end": 17.48, + "confidence": 0.896 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 17.66, + "end": 18.96, + "text": " I really missed you.", + "tokens": [ + 51214, + 286, + 534, + 6721, + 291, + 13, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.479, + "words": [ + { + "text": "I", + "start": 17.66, + "end": 17.86, + "confidence": 0.252 + }, + { + "text": "really", + "start": 17.86, + "end": 18.22, + "confidence": 0.447 + }, + { + "text": "missed", + "start": 18.22, + "end": 18.7, + "confidence": 0.653 + }, + { + "text": "you.", + "start": 18.7, + "end": 18.96, + "confidence": 0.717 + } 
+ ] + }, + { + "id": 8, + "seek": 0, + "start": 19.58, + "end": 20.6, + "text": " I agree.", + "tokens": [ + 51314, + 286, + 3986, + 13, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.36081909347366503, + "compression_ratio": 1.446927374301676, + "no_speech_prob": 0.244294673204422, + "confidence": 0.421, + "words": [ + { + "text": "I", + "start": 19.58, + "end": 20.4, + "confidence": 0.403 + }, + { + "text": "agree.", + "start": 20.4, + "end": 20.6, + "confidence": 0.439 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/large_apollo11.mp3.words.json b/tests/expected/corner_cases/large_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..c3a47745197c8551a120143206ea1eebd2b93ac2 --- /dev/null +++ b/tests/expected/corner_cases/large_apollo11.mp3.words.json @@ -0,0 +1,1208 @@ +{ + "text": " Apollo 11, Houston. We got a recommendation for you on your DOJ's E-A limb, E-G-E-A's, over. Go ahead. Okay, we'd like to have, say, a selected one or two on the helmet. We're going to have an B1. And you could put the other one on Mike's helmet, we're still seeing the bleepers. Over. with a cover I tried it already. Okay fine, we weren't sure that this was a suggestion. We thought we'd uh... you could check it out. How much you've already done that. So uh... I guess whatever you can come up with, just let us know and... Okay there's no problem. Okay, there's no problem. We'll let you know where they end up. Nice.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.36, + "end": 6.96, + "text": " Apollo 11, Houston. 
We got a recommendation for you on your DOJ's E-A limb, E-G-E-A's, over.", + "tokens": [ + 50364, + 25187, + 2975, + 11, + 18717, + 13, + 492, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 10699, + 41, + 311, + 462, + 12, + 32, + 30390, + 11, + 462, + 12, + 38, + 12, + 36, + 12, + 32, + 311, + 11, + 670, + 13, + 50714 + ], + "temperature": 0.4, + "avg_logprob": -0.6033297837382615, + "compression_ratio": 1.425, + "no_speech_prob": 0.3341304659843445, + "confidence": 0.595, + "words": [ + { + "text": "Apollo", + "start": 0.36, + "end": 0.92, + "confidence": 0.79 + }, + { + "text": "11,", + "start": 0.92, + "end": 1.32, + "confidence": 0.877 + }, + { + "text": "Houston.", + "start": 1.5, + "end": 1.74, + "confidence": 0.827 + }, + { + "text": "We", + "start": 1.9, + "end": 1.94, + "confidence": 0.836 + }, + { + "text": "got", + "start": 1.94, + "end": 2.1, + "confidence": 0.639 + }, + { + "text": "a", + "start": 2.1, + "end": 2.3, + "confidence": 0.995 + }, + { + "text": "recommendation", + "start": 2.3, + "end": 3.08, + "confidence": 0.709 + }, + { + "text": "for", + "start": 3.08, + "end": 3.46, + "confidence": 0.856 + }, + { + "text": "you", + "start": 3.46, + "end": 3.62, + "confidence": 0.859 + }, + { + "text": "on", + "start": 3.62, + "end": 3.76, + "confidence": 0.87 + }, + { + "text": "your", + "start": 3.76, + "end": 4.06, + "confidence": 0.767 + }, + { + "text": "DOJ's", + "start": 4.06, + "end": 4.88, + "confidence": 0.163 + }, + { + "text": "E-A", + "start": 4.88, + "end": 5.3, + "confidence": 0.408 + }, + { + "text": "limb,", + "start": 5.3, + "end": 5.62, + "confidence": 0.264 + }, + { + "text": "E-G-E-A's,", + "start": 5.76, + "end": 6.8, + "confidence": 0.768 + }, + { + "text": "over.", + "start": 6.82, + "end": 6.96, + "confidence": 0.817 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.74, + "end": 11.14, + "text": " Go ahead.", + "tokens": [ + 50864, + 1037, + 2286, + 13, + 50914 + ], + "temperature": 0.4, + "avg_logprob": 
-0.6033297837382615, + "compression_ratio": 1.425, + "no_speech_prob": 0.3341304659843445, + "confidence": 0.85, + "words": [ + { + "text": "Go", + "start": 10.74, + "end": 10.98, + "confidence": 0.842 + }, + { + "text": "ahead.", + "start": 10.98, + "end": 11.14, + "confidence": 0.858 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 11.88, + "end": 17.3, + "text": " Okay, we'd like to have, say, a selected one or two on the helmet.", + "tokens": [ + 50914, + 1033, + 11, + 321, + 1116, + 411, + 281, + 362, + 11, + 584, + 11, + 257, + 8209, + 472, + 420, + 732, + 322, + 264, + 15922, + 13, + 51214 + ], + "temperature": 0.4, + "avg_logprob": -0.6033297837382615, + "compression_ratio": 1.425, + "no_speech_prob": 0.3341304659843445, + "confidence": 0.428, + "words": [ + { + "text": "Okay,", + "start": 11.88, + "end": 12.28, + "confidence": 0.507 + }, + { + "text": "we'd", + "start": 12.5, + "end": 13.16, + "confidence": 0.623 + }, + { + "text": "like", + "start": 13.16, + "end": 13.32, + "confidence": 0.876 + }, + { + "text": "to", + "start": 13.32, + "end": 13.56, + "confidence": 0.737 + }, + { + "text": "have,", + "start": 13.56, + "end": 14.24, + "confidence": 0.124 + }, + { + "text": "say,", + "start": 14.74, + "end": 15.0, + "confidence": 0.153 + }, + { + "text": "a", + "start": 15.1, + "end": 15.16, + "confidence": 0.061 + }, + { + "text": "selected", + "start": 15.16, + "end": 15.76, + "confidence": 0.143 + }, + { + "text": "one", + "start": 15.76, + "end": 16.08, + "confidence": 0.754 + }, + { + "text": "or", + "start": 16.08, + "end": 16.22, + "confidence": 0.67 + }, + { + "text": "two", + "start": 16.22, + "end": 16.36, + "confidence": 0.6 + }, + { + "text": "on", + "start": 16.36, + "end": 16.6, + "confidence": 0.875 + }, + { + "text": "the", + "start": 16.6, + "end": 16.82, + "confidence": 0.809 + }, + { + "text": "helmet.", + "start": 16.82, + "end": 17.3, + "confidence": 0.651 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 17.32, + "end": 19.12, + 
"text": " We're going to have an B1.", + "tokens": [ + 51214, + 492, + 434, + 516, + 281, + 362, + 364, + 363, + 16, + 13, + 51314 + ], + "temperature": 0.4, + "avg_logprob": -0.6033297837382615, + "compression_ratio": 1.425, + "no_speech_prob": 0.3341304659843445, + "confidence": 0.545, + "words": [ + { + "text": "We're", + "start": 17.32, + "end": 17.78, + "confidence": 0.7 + }, + { + "text": "going", + "start": 17.78, + "end": 17.94, + "confidence": 0.505 + }, + { + "text": "to", + "start": 17.94, + "end": 18.06, + "confidence": 0.899 + }, + { + "text": "have", + "start": 18.06, + "end": 18.22, + "confidence": 0.848 + }, + { + "text": "an", + "start": 18.22, + "end": 18.4, + "confidence": 0.264 + }, + { + "text": "B1.", + "start": 18.4, + "end": 19.12, + "confidence": 0.395 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 20.08, + "end": 24.32, + "text": " And you could put the other one on Mike's helmet, we're still seeing the bleepers.", + "tokens": [ + 51314, + 400, + 291, + 727, + 829, + 264, + 661, + 472, + 322, + 6602, + 311, + 15922, + 11, + 321, + 434, + 920, + 2577, + 264, + 5408, + 595, + 433, + 13, + 51564 + ], + "temperature": 0.4, + "avg_logprob": -0.6033297837382615, + "compression_ratio": 1.425, + "no_speech_prob": 0.3341304659843445, + "confidence": 0.528, + "words": [ + { + "text": "And", + "start": 20.08, + "end": 20.22, + "confidence": 0.796 + }, + { + "text": "you", + "start": 20.22, + "end": 20.34, + "confidence": 0.885 + }, + { + "text": "could", + "start": 20.34, + "end": 20.48, + "confidence": 0.415 + }, + { + "text": "put", + "start": 20.48, + "end": 20.66, + "confidence": 0.894 + }, + { + "text": "the", + "start": 20.66, + "end": 20.84, + "confidence": 0.813 + }, + { + "text": "other", + "start": 20.84, + "end": 21.02, + "confidence": 0.774 + }, + { + "text": "one", + "start": 21.02, + "end": 21.22, + "confidence": 0.779 + }, + { + "text": "on", + "start": 21.22, + "end": 21.46, + "confidence": 0.906 + }, + { + "text": "Mike's", + 
"start": 21.46, + "end": 22.72, + "confidence": 0.831 + }, + { + "text": "helmet,", + "start": 22.72, + "end": 22.86, + "confidence": 0.791 + }, + { + "text": "we're", + "start": 23.06, + "end": 23.14, + "confidence": 0.354 + }, + { + "text": "still", + "start": 23.14, + "end": 23.34, + "confidence": 0.792 + }, + { + "text": "seeing", + "start": 23.34, + "end": 23.64, + "confidence": 0.728 + }, + { + "text": "the", + "start": 23.64, + "end": 23.88, + "confidence": 0.099 + }, + { + "text": "bleepers.", + "start": 23.88, + "end": 24.32, + "confidence": 0.228 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 24.86, + "end": 25.1, + "text": " Over.", + "tokens": [ + 51564, + 4886, + 13, + 51614 + ], + "temperature": 0.4, + "avg_logprob": -0.6033297837382615, + "compression_ratio": 1.425, + "no_speech_prob": 0.3341304659843445, + "confidence": 0.616, + "words": [ + { + "text": "Over.", + "start": 24.86, + "end": 25.1, + "confidence": 0.616 + } + ] + }, + { + "id": 6, + "seek": 6000, + "start": 60.0, + "end": 61.9, + "text": " with a cover I tried it already.", + "tokens": [ + 50364, + 365, + 257, + 2060, + 286, + 3031, + 309, + 1217, + 13, + 50474 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.442, + "words": [ + { + "text": "with", + "start": 60.0, + "end": 60.2, + "confidence": 0.119 + }, + { + "text": "a", + "start": 60.2, + "end": 60.38, + "confidence": 0.457 + }, + { + "text": "cover", + "start": 60.38, + "end": 61.04, + "confidence": 0.558 + }, + { + "text": "I", + "start": 61.04, + "end": 61.22, + "confidence": 0.278 + }, + { + "text": "tried", + "start": 61.22, + "end": 61.48, + "confidence": 0.625 + }, + { + "text": "it", + "start": 61.48, + "end": 61.64, + "confidence": 0.802 + }, + { + "text": "already.", + "start": 61.64, + "end": 61.9, + "confidence": 0.772 + } + ] + }, + { + "id": 7, + "seek": 6000, + "start": 62.42, + "end": 65.18, + 
"text": " Okay fine, we weren't sure that this was a suggestion.", + "tokens": [ + 50474, + 1033, + 2489, + 11, + 321, + 4999, + 380, + 988, + 300, + 341, + 390, + 257, + 16541, + 13, + 50629 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.666, + "words": [ + { + "text": "Okay", + "start": 62.42, + "end": 62.82, + "confidence": 0.414 + }, + { + "text": "fine,", + "start": 62.82, + "end": 63.1, + "confidence": 0.467 + }, + { + "text": "we", + "start": 63.22, + "end": 63.3, + "confidence": 0.846 + }, + { + "text": "weren't", + "start": 63.3, + "end": 63.56, + "confidence": 0.886 + }, + { + "text": "sure", + "start": 63.56, + "end": 63.74, + "confidence": 0.809 + }, + { + "text": "that", + "start": 63.74, + "end": 64.1, + "confidence": 0.513 + }, + { + "text": "this", + "start": 64.1, + "end": 64.58, + "confidence": 0.59 + }, + { + "text": "was", + "start": 64.58, + "end": 64.76, + "confidence": 0.787 + }, + { + "text": "a", + "start": 64.76, + "end": 64.88, + "confidence": 0.769 + }, + { + "text": "suggestion.", + "start": 64.88, + "end": 65.18, + "confidence": 0.605 + } + ] + }, + { + "id": 8, + "seek": 6000, + "start": 65.22, + "end": 66.76, + "text": " We thought we'd uh...", + "tokens": [ + 50629, + 492, + 1194, + 321, + 1116, + 2232, + 485, + 50699 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.604, + "words": [ + { + "text": "We", + "start": 65.22, + "end": 65.4, + "confidence": 0.876 + }, + { + "text": "thought", + "start": 65.4, + "end": 65.56, + "confidence": 0.816 + }, + { + "text": "we'd", + "start": 65.56, + "end": 65.88, + "confidence": 0.561 + }, + { + "text": "uh...", + "start": 65.88, + "end": 66.76, + "confidence": 0.356 + } + ] + }, + { + "id": 9, + "seek": 6000, + "start": 66.76, + "end": 67.82, + "text": " you 
could check it out.", + "tokens": [ + 50699, + 291, + 727, + 1520, + 309, + 484, + 13, + 50769 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.599, + "words": [ + { + "text": "you", + "start": 66.76, + "end": 67.04, + "confidence": 0.191 + }, + { + "text": "could", + "start": 67.04, + "end": 67.22, + "confidence": 0.698 + }, + { + "text": "check", + "start": 67.22, + "end": 67.44, + "confidence": 0.792 + }, + { + "text": "it", + "start": 67.44, + "end": 67.58, + "confidence": 0.901 + }, + { + "text": "out.", + "start": 67.58, + "end": 67.82, + "confidence": 0.811 + } + ] + }, + { + "id": 10, + "seek": 6000, + "start": 68.18, + "end": 69.3, + "text": " How much you've already done that.", + "tokens": [ + 50769, + 1012, + 709, + 291, + 600, + 1217, + 1096, + 300, + 13, + 50834 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.617, + "words": [ + { + "text": "How", + "start": 68.18, + "end": 68.42, + "confidence": 0.234 + }, + { + "text": "much", + "start": 68.42, + "end": 68.6, + "confidence": 0.806 + }, + { + "text": "you've", + "start": 68.6, + "end": 68.76, + "confidence": 0.575 + }, + { + "text": "already", + "start": 68.76, + "end": 68.88, + "confidence": 0.814 + }, + { + "text": "done", + "start": 68.88, + "end": 69.1, + "confidence": 0.779 + }, + { + "text": "that.", + "start": 69.1, + "end": 69.3, + "confidence": 0.861 + } + ] + }, + { + "id": 11, + "seek": 6000, + "start": 69.36, + "end": 70.26, + "text": " So uh...", + "tokens": [ + 50834, + 407, + 2232, + 485, + 50879 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.644, + "words": [ + { + "text": "So", + "start": 69.36, + "end": 69.66, + "confidence": 0.883 + 
}, + { + "text": "uh...", + "start": 69.66, + "end": 70.26, + "confidence": 0.469 + } + ] + }, + { + "id": 12, + "seek": 6000, + "start": 70.32, + "end": 71.8, + "text": " I guess whatever you can come up with,", + "tokens": [ + 50879, + 286, + 2041, + 2035, + 291, + 393, + 808, + 493, + 365, + 11, + 50954 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.632, + "words": [ + { + "text": "I", + "start": 70.32, + "end": 70.5, + "confidence": 0.992 + }, + { + "text": "guess", + "start": 70.5, + "end": 70.7, + "confidence": 0.905 + }, + { + "text": "whatever", + "start": 70.7, + "end": 71.12, + "confidence": 0.201 + }, + { + "text": "you", + "start": 71.12, + "end": 71.26, + "confidence": 0.884 + }, + { + "text": "can", + "start": 71.26, + "end": 71.32, + "confidence": 0.281 + }, + { + "text": "come", + "start": 71.32, + "end": 71.46, + "confidence": 0.777 + }, + { + "text": "up", + "start": 71.46, + "end": 71.62, + "confidence": 0.898 + }, + { + "text": "with,", + "start": 71.62, + "end": 71.8, + "confidence": 0.817 + } + ] + }, + { + "id": 13, + "seek": 6000, + "start": 71.8, + "end": 72.76, + "text": " just let us know and...", + "tokens": [ + 50954, + 445, + 718, + 505, + 458, + 293, + 485, + 51004 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.721, + "words": [ + { + "text": "just", + "start": 71.8, + "end": 71.98, + "confidence": 0.866 + }, + { + "text": "let", + "start": 71.98, + "end": 72.12, + "confidence": 0.905 + }, + { + "text": "us", + "start": 72.12, + "end": 72.26, + "confidence": 0.904 + }, + { + "text": "know", + "start": 72.26, + "end": 72.42, + "confidence": 0.798 + }, + { + "text": "and...", + "start": 72.42, + "end": 72.76, + "confidence": 0.346 + } + ] + }, + { + "id": 14, + "seek": 6000, + "start": 74.16, + "end": 
75.24, + "text": " Okay there's no problem.", + "tokens": [ + 51004, + 1033, + 456, + 311, + 572, + 1154, + 13, + 51129 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.558, + "words": [ + { + "text": "Okay", + "start": 74.16, + "end": 74.44, + "confidence": 0.335 + }, + { + "text": "there's", + "start": 74.44, + "end": 74.74, + "confidence": 0.486 + }, + { + "text": "no", + "start": 74.74, + "end": 74.88, + "confidence": 0.888 + }, + { + "text": "problem.", + "start": 74.88, + "end": 75.24, + "confidence": 0.771 + } + ] + }, + { + "id": 15, + "seek": 6000, + "start": 75.32, + "end": 76.56, + "text": " Okay, there's no problem.", + "tokens": [ + 51129, + 1033, + 11, + 456, + 311, + 572, + 1154, + 13, + 51194 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.777, + "words": [ + { + "text": "Okay,", + "start": 75.32, + "end": 75.84, + "confidence": 0.784 + }, + { + "text": "there's", + "start": 76.0, + "end": 76.08, + "confidence": 0.712 + }, + { + "text": "no", + "start": 76.08, + "end": 76.22, + "confidence": 0.898 + }, + { + "text": "problem.", + "start": 76.22, + "end": 76.56, + "confidence": 0.793 + } + ] + }, + { + "id": 16, + "seek": 6000, + "start": 76.6, + "end": 77.8, + "text": " We'll let you know where they end up.", + "tokens": [ + 51194, + 492, + 603, + 718, + 291, + 458, + 689, + 436, + 917, + 493, + 13, + 51259 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.723, + "words": [ + { + "text": "We'll", + "start": 76.6, + "end": 76.82, + "confidence": 0.834 + }, + { + "text": "let", + "start": 76.82, + "end": 76.96, + "confidence": 0.885 + }, + { + "text": "you", + "start": 76.96, + "end": 77.04, + "confidence": 
0.764 + }, + { + "text": "know", + "start": 77.04, + "end": 77.2, + "confidence": 0.815 + }, + { + "text": "where", + "start": 77.2, + "end": 77.32, + "confidence": 0.6 + }, + { + "text": "they", + "start": 77.32, + "end": 77.42, + "confidence": 0.33 + }, + { + "text": "end", + "start": 77.42, + "end": 77.54, + "confidence": 0.787 + }, + { + "text": "up.", + "start": 77.54, + "end": 77.8, + "confidence": 0.905 + } + ] + }, + { + "id": 17, + "seek": 6000, + "start": 77.94, + "end": 78.32, + "text": " Nice.", + "tokens": [ + 51259, + 5490, + 13, + 51299 + ], + "temperature": 0.4, + "avg_logprob": -0.6061306174741973, + "compression_ratio": 1.5876777251184835, + "no_speech_prob": 0.0662694051861763, + "confidence": 0.495, + "words": [ + { + "text": "Nice.", + "start": 77.94, + "end": 78.32, + "confidence": 0.495 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/medium.accurate_gloria.mp3.words.json b/tests/expected/corner_cases/medium.accurate_gloria.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..afa758f8da5b91ba2d7cb5705d796df78040207f --- /dev/null +++ b/tests/expected/corner_cases/medium.accurate_gloria.mp3.words.json @@ -0,0 +1,544 @@ +{ + "text": " Hello. How are you? How are you? Oh, I'm okay. I will be. I said she could stay with us tomorrow until she feels better. Of course she can. This won't be for long. Well, you can stay as long as you want, my love. 
I really miss you.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 1.32, + "end": 1.82, + "text": " Hello.", + "tokens": [ + 50364, + 2425, + 13, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.189, + "words": [ + { + "text": "Hello.", + "start": 1.32, + "end": 1.82, + "confidence": 0.189 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.94, + "end": 3.54, + "text": " How are you?", + "tokens": [ + 50464, + 1012, + 366, + 291, + 30, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.157, + "words": [ + { + "text": "How", + "start": 1.94, + "end": 2.6, + "confidence": 0.004 + }, + { + "text": "are", + "start": 2.6, + "end": 3.1, + "confidence": 0.238 + }, + { + "text": "you?", + "start": 3.1, + "end": 3.54, + "confidence": 0.809 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 3.7, + "end": 6.38, + "text": " How are you?", + "tokens": [ + 50564, + 1012, + 366, + 291, + 30, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.353, + "words": [ + { + "text": "How", + "start": 3.7, + "end": 4.3, + "confidence": 0.021 + }, + { + "text": "are", + "start": 4.3, + "end": 6.12, + "confidence": 0.93 + }, + { + "text": "you?", + "start": 6.12, + "end": 6.38, + "confidence": 0.897 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 6.38, + "end": 7.74, + "text": " Oh, I'm okay.", + "tokens": [ + 50664, + 876, + 11, + 286, + 478, + 1392, + 13, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.63, + "words": [ + { + "text": "Oh,", + "start": 6.38, + "end": 6.66, + 
"confidence": 0.37 + }, + { + "text": "I'm", + "start": 6.76, + "end": 7.18, + "confidence": 0.979 + }, + { + "text": "okay.", + "start": 7.18, + "end": 7.74, + "confidence": 0.692 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 7.74, + "end": 9.2, + "text": " I will be.", + "tokens": [ + 50764, + 286, + 486, + 312, + 13, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.543, + "words": [ + { + "text": "I", + "start": 7.74, + "end": 8.64, + "confidence": 0.467 + }, + { + "text": "will", + "start": 8.64, + "end": 8.88, + "confidence": 0.582 + }, + { + "text": "be.", + "start": 8.88, + "end": 9.2, + "confidence": 0.565 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 9.5, + "end": 11.56, + "text": " I said she could stay with us tomorrow until she feels better.", + "tokens": [ + 50864, + 286, + 848, + 750, + 727, + 1754, + 365, + 505, + 4153, + 1826, + 750, + 3417, + 1101, + 13, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.494, + "words": [ + { + "text": "I", + "start": 9.5, + "end": 9.52, + "confidence": 0.283 + }, + { + "text": "said", + "start": 9.52, + "end": 9.64, + "confidence": 0.561 + }, + { + "text": "she", + "start": 9.64, + "end": 9.78, + "confidence": 0.919 + }, + { + "text": "could", + "start": 9.78, + "end": 9.98, + "confidence": 0.898 + }, + { + "text": "stay", + "start": 9.98, + "end": 10.16, + "confidence": 0.993 + }, + { + "text": "with", + "start": 10.16, + "end": 10.28, + "confidence": 0.991 + }, + { + "text": "us", + "start": 10.28, + "end": 10.46, + "confidence": 0.966 + }, + { + "text": "tomorrow", + "start": 10.46, + "end": 10.68, + "confidence": 0.004 + }, + { + "text": "until", + "start": 10.68, + "end": 10.84, + "confidence": 0.312 + }, + { + "text": "she", + "start": 10.84, + 
"end": 10.98, + "confidence": 0.997 + }, + { + "text": "feels", + "start": 10.98, + "end": 11.2, + "confidence": 0.988 + }, + { + "text": "better.", + "start": 11.2, + "end": 11.56, + "confidence": 0.825 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 11.56, + "end": 13.42, + "text": " Of course she can.", + "tokens": [ + 50964, + 2720, + 1164, + 750, + 393, + 13, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.31, + "words": [ + { + "text": "Of", + "start": 11.56, + "end": 12.54, + "confidence": 0.09 + }, + { + "text": "course", + "start": 12.54, + "end": 12.72, + "confidence": 0.985 + }, + { + "text": "she", + "start": 12.72, + "end": 13.04, + "confidence": 0.208 + }, + { + "text": "can.", + "start": 13.04, + "end": 13.42, + "confidence": 0.392 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 13.54, + "end": 15.24, + "text": " This won't be for long.", + "tokens": [ + 51064, + 639, + 1582, + 380, + 312, + 337, + 938, + 13, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.444, + "words": [ + { + "text": "This", + "start": 13.54, + "end": 14.16, + "confidence": 0.007 + }, + { + "text": "won't", + "start": 14.16, + "end": 14.58, + "confidence": 0.926 + }, + { + "text": "be", + "start": 14.58, + "end": 14.8, + "confidence": 0.99 + }, + { + "text": "for", + "start": 14.8, + "end": 14.98, + "confidence": 0.978 + }, + { + "text": "long.", + "start": 14.98, + "end": 15.24, + "confidence": 0.764 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 15.5, + "end": 17.62, + "text": " Well, you can stay as long as you want, my love.", + "tokens": [ + 51164, + 1042, + 11, + 291, + 393, + 1754, + 382, + 938, + 382, + 291, + 528, + 11, + 452, + 959, + 13, + 51264 + ], + "temperature": 0.0, + "avg_logprob": 
-0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.587, + "words": [ + { + "text": "Well,", + "start": 15.5, + "end": 15.52, + "confidence": 0.073 + }, + { + "text": "you", + "start": 15.52, + "end": 15.66, + "confidence": 0.491 + }, + { + "text": "can", + "start": 15.66, + "end": 15.88, + "confidence": 0.876 + }, + { + "text": "stay", + "start": 15.88, + "end": 16.12, + "confidence": 0.932 + }, + { + "text": "as", + "start": 16.12, + "end": 16.28, + "confidence": 0.979 + }, + { + "text": "long", + "start": 16.28, + "end": 16.4, + "confidence": 0.995 + }, + { + "text": "as", + "start": 16.4, + "end": 16.54, + "confidence": 0.995 + }, + { + "text": "you", + "start": 16.54, + "end": 16.62, + "confidence": 0.995 + }, + { + "text": "want,", + "start": 16.62, + "end": 16.8, + "confidence": 0.643 + }, + { + "text": "my", + "start": 16.98, + "end": 17.2, + "confidence": 0.958 + }, + { + "text": "love.", + "start": 17.2, + "end": 17.62, + "confidence": 0.835 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 17.62, + "end": 19.52, + "text": " I really miss you.", + "tokens": [ + 51264, + 286, + 534, + 1713, + 291, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.21371329812442555, + "compression_ratio": 1.4713375796178343, + "no_speech_prob": 0.050164904445409775, + "confidence": 0.477, + "words": [ + { + "text": "I", + "start": 17.62, + "end": 17.94, + "confidence": 0.495 + }, + { + "text": "really", + "start": 17.94, + "end": 18.3, + "confidence": 0.89 + }, + { + "text": "miss", + "start": 18.3, + "end": 18.78, + "confidence": 0.338 + }, + { + "text": "you.", + "start": 18.78, + "end": 19.52, + "confidence": 0.408 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/medium.efficient_gloria.mp3.words.json b/tests/expected/corner_cases/medium.efficient_gloria.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..439728f2cd4ff2aadde1461f93aefbddeff1861a --- /dev/null +++ b/tests/expected/corner_cases/medium.efficient_gloria.mp3.words.json @@ -0,0 +1,538 @@ +{ + "text": " Hello. How are you? Love. How are you? I'm okay. I will be. I said she could stay with us tomorrow, she feels better. Of course she can. This won't be for long. Well, you can stay as long as you want, my love. I really miss you.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 1.4, + "end": 1.74, + "text": " Hello.", + "tokens": [ + 50364, + 2425, + 13, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.285, + "words": [ + { + "text": "Hello.", + "start": 1.4, + "end": 1.74, + "confidence": 0.285 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 2.32, + "end": 3.5, + "text": " How are you?", + "tokens": [ + 50464, + 1012, + 366, + 291, + 30, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.786, + "words": [ + { + "text": "How", + "start": 2.32, + "end": 2.82, + "confidence": 0.551 + }, + { + "text": "are", + "start": 2.82, + "end": 3.24, + "confidence": 0.989 + }, + { + "text": "you?", + "start": 3.24, + "end": 3.5, + "confidence": 0.893 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 3.5, + "end": 4.26, + "text": " Love.", + "tokens": [ + 50564, + 5956, + 13, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.244, + "words": [ + { + "text": "Love.", + "start": 3.5, + "end": 4.26, + "confidence": 0.244 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 5.5, + "end": 6.38, + "text": " How are you?", + "tokens": [ + 50664, + 1012, + 366, + 291, + 30, + 50764 + ], + "temperature": 
0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.926, + "words": [ + { + "text": "How", + "start": 5.5, + "end": 5.68, + "confidence": 0.851 + }, + { + "text": "are", + "start": 5.68, + "end": 6.08, + "confidence": 0.998 + }, + { + "text": "you?", + "start": 6.08, + "end": 6.38, + "confidence": 0.935 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 7.5, + "end": 9.18, + "text": " I'm okay. I will be.", + "tokens": [ + 50764, + 286, + 478, + 1392, + 13, + 286, + 486, + 312, + 13, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.77, + "words": [ + { + "text": "I'm", + "start": 7.5, + "end": 7.52, + "confidence": 0.767 + }, + { + "text": "okay.", + "start": 7.52, + "end": 8.22, + "confidence": 0.488 + }, + { + "text": "I", + "start": 8.42, + "end": 8.64, + "confidence": 0.767 + }, + { + "text": "will", + "start": 8.64, + "end": 8.94, + "confidence": 0.949 + }, + { + "text": "be.", + "start": 8.94, + "end": 9.18, + "confidence": 0.997 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 9.5, + "end": 11.52, + "text": " I said she could stay with us tomorrow, she feels better.", + "tokens": [ + 50864, + 286, + 848, + 750, + 727, + 1754, + 365, + 505, + 4153, + 11, + 750, + 3417, + 1101, + 13, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.786, + "words": [ + { + "text": "I", + "start": 9.5, + "end": 9.52, + "confidence": 0.883 + }, + { + "text": "said", + "start": 9.52, + "end": 9.64, + "confidence": 0.856 + }, + { + "text": "she", + "start": 9.64, + "end": 9.78, + "confidence": 0.928 + }, + { + "text": "could", + "start": 9.78, + "end": 9.96, + "confidence": 0.909 + }, + { + "text": "stay", + "start": 9.96, + "end": 
10.16, + "confidence": 0.994 + }, + { + "text": "with", + "start": 10.16, + "end": 10.28, + "confidence": 0.977 + }, + { + "text": "us", + "start": 10.28, + "end": 10.46, + "confidence": 0.993 + }, + { + "text": "tomorrow,", + "start": 10.46, + "end": 10.66, + "confidence": 0.514 + }, + { + "text": "she", + "start": 10.72, + "end": 10.86, + "confidence": 0.279 + }, + { + "text": "feels", + "start": 10.86, + "end": 11.16, + "confidence": 0.809 + }, + { + "text": "better.", + "start": 11.16, + "end": 11.52, + "confidence": 0.992 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 12.06, + "end": 13.36, + "text": " Of course she can.", + "tokens": [ + 50964, + 2720, + 1164, + 750, + 393, + 13, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.928, + "words": [ + { + "text": "Of", + "start": 12.06, + "end": 12.34, + "confidence": 0.788 + }, + { + "text": "course", + "start": 12.34, + "end": 12.56, + "confidence": 0.989 + }, + { + "text": "she", + "start": 12.56, + "end": 12.88, + "confidence": 0.958 + }, + { + "text": "can.", + "start": 12.88, + "end": 13.36, + "confidence": 0.993 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 13.5, + "end": 15.26, + "text": " This won't be for long.", + "tokens": [ + 51064, + 639, + 1582, + 380, + 312, + 337, + 938, + 13, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.892, + "words": [ + { + "text": "This", + "start": 13.5, + "end": 14.28, + "confidence": 0.543 + }, + { + "text": "won't", + "start": 14.28, + "end": 14.6, + "confidence": 0.975 + }, + { + "text": "be", + "start": 14.6, + "end": 14.8, + "confidence": 0.996 + }, + { + "text": "for", + "start": 14.8, + "end": 14.96, + "confidence": 0.984 + }, + { + "text": "long.", + "start": 14.96, + "end": 15.26, + "confidence": 
0.996 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 15.5, + "end": 17.62, + "text": " Well, you can stay as long as you want, my love.", + "tokens": [ + 51164, + 1042, + 11, + 291, + 393, + 1754, + 382, + 938, + 382, + 291, + 528, + 11, + 452, + 959, + 13, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.927, + "words": [ + { + "text": "Well,", + "start": 15.5, + "end": 15.56, + "confidence": 0.675 + }, + { + "text": "you", + "start": 15.68, + "end": 15.7, + "confidence": 0.744 + }, + { + "text": "can", + "start": 15.7, + "end": 15.94, + "confidence": 0.982 + }, + { + "text": "stay", + "start": 15.94, + "end": 16.14, + "confidence": 0.985 + }, + { + "text": "as", + "start": 16.14, + "end": 16.28, + "confidence": 0.972 + }, + { + "text": "long", + "start": 16.28, + "end": 16.4, + "confidence": 0.994 + }, + { + "text": "as", + "start": 16.4, + "end": 16.48, + "confidence": 0.996 + }, + { + "text": "you", + "start": 16.48, + "end": 16.62, + "confidence": 0.995 + }, + { + "text": "want,", + "start": 16.62, + "end": 16.8, + "confidence": 0.995 + }, + { + "text": "my", + "start": 16.88, + "end": 17.22, + "confidence": 0.95 + }, + { + "text": "love.", + "start": 17.22, + "end": 17.62, + "confidence": 0.993 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 17.76, + "end": 19.26, + "text": " I really miss you.", + "tokens": [ + 51264, + 286, + 534, + 1713, + 291, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.792, + "words": [ + { + "text": "I", + "start": 17.76, + "end": 17.98, + "confidence": 0.587 + }, + { + "text": "really", + "start": 17.98, + "end": 18.36, + "confidence": 0.944 + }, + { + "text": "miss", + "start": 18.36, + "end": 18.78, + "confidence": 0.905 + }, + { + "text": "you.", + "start": 18.78, 
+ "end": 19.26, + "confidence": 0.787 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/nocond.random_music.mp4.words.json b/tests/expected/corner_cases/nocond.random_music.mp4.words.json new file mode 100644 index 0000000000000000000000000000000000000000..f06d275035a63608dd63d45f0e1f4a80d5424924 --- /dev/null +++ b/tests/expected/corner_cases/nocond.random_music.mp4.words.json @@ -0,0 +1,2847 @@ +{ + "text": " I As you're praying for my phone And the laughter in the holes And the names that I've been called I stack it in my mind And I'm waiting for the time When I show you what it's like To be worse than in a mine Tell you, you're the greatest But once you turn they hate us Oh, the misery Everybody wants to be my enemy I smell the sympathy Everybody wants to be my enemy Look out for yourself My enemy Look out for yourself Look, okay, I'm Hoping that somebody pray for me I'm praying that somebody vote for me I'm staying where nobody's supposed to be I propose to be in a wreck of emotions Ready to go whenever she let me know The road is long so put the pedal into the flow The enemy on my trail, my energy unavailable I'ma tell the master the way go Hey, when I'm flat on my track to the top I been out of shape, thinking that I'm a box of an astronaut Blasted off the planet, rocked the cars, catastrophic And it matters more because I had it, now I had it I thought about wreaking havoc on an opposition Kinda shockin', they want it static, with precision I'm automatic, quarterback, I ain't talkin' second Pack it, pack it up, I don't panic, better batter up Who the baddest, it don't matter cause we is your Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy Oh, the misery Everybody wants to be my enemy Spell the sympathy Everybody wants to be my enemy Everywhere I swear I'll never be a saint Nowhere my enemy Everywhere I swear I'll never be a saint Look out for yourself", + "segments": 
[ + { + "id": 0, + "seek": 0, + "start": 2.24, + "end": 2.36, + "text": " I", + "tokens": [ + 50364, + 286, + 50464 + ], + "temperature": 0.4, + "avg_logprob": -0.9355003237724304, + "compression_ratio": 0.1111111111111111, + "no_speech_prob": 0.7811808586120605, + "confidence": 0.032, + "words": [ + { + "text": "I", + "start": 2.24, + "end": 2.36, + "confidence": 0.032 + } + ] + }, + { + "id": 1, + "seek": 9000, + "start": 90.18, + "end": 91.7, + "text": " As you're praying for my phone", + "tokens": [ + 50364, + 1018, + 291, + 434, + 15611, + 337, + 452, + 2593, + 50446 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.716, + "words": [ + { + "text": "As", + "start": 90.18, + "end": 90.32, + "confidence": 0.357 + }, + { + "text": "you're", + "start": 90.32, + "end": 90.46, + "confidence": 0.893 + }, + { + "text": "praying", + "start": 90.46, + "end": 90.88, + "confidence": 0.966 + }, + { + "text": "for", + "start": 90.88, + "end": 91.12, + "confidence": 0.994 + }, + { + "text": "my", + "start": 91.12, + "end": 91.3, + "confidence": 0.997 + }, + { + "text": "phone", + "start": 91.3, + "end": 91.7, + "confidence": 0.353 + } + ] + }, + { + "id": 2, + "seek": 9000, + "start": 91.78, + "end": 93.22, + "text": " And the laughter in the holes", + "tokens": [ + 50446, + 400, + 264, + 13092, + 294, + 264, + 8118, + 50524 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.864, + "words": [ + { + "text": "And", + "start": 91.78, + "end": 91.92, + "confidence": 0.885 + }, + { + "text": "the", + "start": 91.92, + "end": 92.1, + "confidence": 0.99 + }, + { + "text": "laughter", + "start": 92.1, + "end": 92.5, + "confidence": 0.993 + }, + { + "text": "in", + "start": 92.5, + "end": 92.78, + "confidence": 0.895 + }, + { + "text": "the", + "start": 
92.78, + "end": 92.92, + "confidence": 0.995 + }, + { + "text": "holes", + "start": 92.92, + "end": 93.22, + "confidence": 0.538 + } + ] + }, + { + "id": 3, + "seek": 9000, + "start": 93.34, + "end": 94.76, + "text": " And the names that I've been called", + "tokens": [ + 50524, + 400, + 264, + 5288, + 300, + 286, + 600, + 668, + 1219, + 50604 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.97, + "words": [ + { + "text": "And", + "start": 93.34, + "end": 93.48, + "confidence": 0.956 + }, + { + "text": "the", + "start": 93.48, + "end": 93.6, + "confidence": 0.994 + }, + { + "text": "names", + "start": 93.6, + "end": 93.86, + "confidence": 0.989 + }, + { + "text": "that", + "start": 93.86, + "end": 94.14, + "confidence": 0.982 + }, + { + "text": "I've", + "start": 94.14, + "end": 94.32, + "confidence": 0.946 + }, + { + "text": "been", + "start": 94.32, + "end": 94.5, + "confidence": 0.998 + }, + { + "text": "called", + "start": 94.5, + "end": 94.76, + "confidence": 0.955 + } + ] + }, + { + "id": 4, + "seek": 9000, + "start": 94.98, + "end": 96.38, + "text": " I stack it in my mind", + "tokens": [ + 50604, + 286, + 8630, + 309, + 294, + 452, + 1575, + 50681 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.96, + "words": [ + { + "text": "I", + "start": 94.98, + "end": 95.14, + "confidence": 0.991 + }, + { + "text": "stack", + "start": 95.14, + "end": 95.46, + "confidence": 0.802 + }, + { + "text": "it", + "start": 95.46, + "end": 95.72, + "confidence": 0.996 + }, + { + "text": "in", + "start": 95.72, + "end": 95.8, + "confidence": 0.996 + }, + { + "text": "my", + "start": 95.8, + "end": 96.1, + "confidence": 0.995 + }, + { + "text": "mind", + "start": 96.1, + "end": 96.38, + "confidence": 0.999 + } + ] + }, + { + "id": 5, + "seek": 
9000, + "start": 96.48, + "end": 97.82, + "text": " And I'm waiting for the time", + "tokens": [ + 50681, + 400, + 286, + 478, + 3806, + 337, + 264, + 565, + 50756 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.989, + "words": [ + { + "text": "And", + "start": 96.48, + "end": 96.6, + "confidence": 0.971 + }, + { + "text": "I'm", + "start": 96.6, + "end": 96.74, + "confidence": 0.994 + }, + { + "text": "waiting", + "start": 96.74, + "end": 97.14, + "confidence": 0.978 + }, + { + "text": "for", + "start": 97.14, + "end": 97.34, + "confidence": 0.997 + }, + { + "text": "the", + "start": 97.34, + "end": 97.54, + "confidence": 0.996 + }, + { + "text": "time", + "start": 97.54, + "end": 97.82, + "confidence": 0.997 + } + ] + }, + { + "id": 6, + "seek": 9000, + "start": 98.0, + "end": 99.44, + "text": " When I show you what it's like", + "tokens": [ + 50756, + 1133, + 286, + 855, + 291, + 437, + 309, + 311, + 411, + 50834 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.98, + "words": [ + { + "text": "When", + "start": 98.0, + "end": 98.14, + "confidence": 0.968 + }, + { + "text": "I", + "start": 98.14, + "end": 98.32, + "confidence": 0.996 + }, + { + "text": "show", + "start": 98.32, + "end": 98.5, + "confidence": 0.907 + }, + { + "text": "you", + "start": 98.5, + "end": 98.76, + "confidence": 0.994 + }, + { + "text": "what", + "start": 98.76, + "end": 98.94, + "confidence": 0.994 + }, + { + "text": "it's", + "start": 98.94, + "end": 99.24, + "confidence": 0.991 + }, + { + "text": "like", + "start": 99.24, + "end": 99.44, + "confidence": 0.999 + } + ] + }, + { + "id": 7, + "seek": 9000, + "start": 99.52, + "end": 101.26, + "text": " To be worse than in a mine", + "tokens": [ + 50834, + 1407, + 312, + 5324, + 813, + 294, + 257, + 3892, + 
50923 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.481, + "words": [ + { + "text": "To", + "start": 99.52, + "end": 99.72, + "confidence": 0.987 + }, + { + "text": "be", + "start": 99.72, + "end": 99.84, + "confidence": 0.999 + }, + { + "text": "worse", + "start": 99.84, + "end": 100.1, + "confidence": 0.472 + }, + { + "text": "than", + "start": 100.1, + "end": 100.38, + "confidence": 0.188 + }, + { + "text": "in", + "start": 100.38, + "end": 100.56, + "confidence": 0.284 + }, + { + "text": "a", + "start": 100.56, + "end": 100.9, + "confidence": 0.407 + }, + { + "text": "mine", + "start": 100.9, + "end": 101.26, + "confidence": 0.591 + } + ] + }, + { + "id": 8, + "seek": 9000, + "start": 101.36, + "end": 106.82, + "text": " Tell you, you're the greatest", + "tokens": [ + 50923, + 5115, + 291, + 11, + 291, + 434, + 264, + 6636, + 51215 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.962, + "words": [ + { + "text": "Tell", + "start": 101.36, + "end": 102.24, + "confidence": 0.898 + }, + { + "text": "you,", + "start": 102.24, + "end": 102.92, + "confidence": 0.993 + }, + { + "text": "you're", + "start": 102.92, + "end": 103.82, + "confidence": 0.971 + }, + { + "text": "the", + "start": 103.82, + "end": 104.34, + "confidence": 0.969 + }, + { + "text": "greatest", + "start": 104.34, + "end": 106.82, + "confidence": 0.973 + } + ] + }, + { + "id": 9, + "seek": 9000, + "start": 107.22, + "end": 113.02, + "text": " But once you turn they hate us", + "tokens": [ + 51215, + 583, + 1564, + 291, + 1261, + 436, + 4700, + 505, + 51520 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.862, + "words": [ + { + "text": "But", + 
"start": 107.22, + "end": 107.62, + "confidence": 0.996 + }, + { + "text": "once", + "start": 107.62, + "end": 108.44, + "confidence": 0.826 + }, + { + "text": "you", + "start": 108.44, + "end": 109.2, + "confidence": 0.998 + }, + { + "text": "turn", + "start": 109.2, + "end": 109.9, + "confidence": 0.908 + }, + { + "text": "they", + "start": 109.9, + "end": 110.38, + "confidence": 0.481 + }, + { + "text": "hate", + "start": 110.38, + "end": 111.92, + "confidence": 0.988 + }, + { + "text": "us", + "start": 111.92, + "end": 113.02, + "confidence": 0.999 + } + ] + }, + { + "id": 10, + "seek": 9000, + "start": 114.64, + "end": 116.2, + "text": " Oh, the misery", + "tokens": [ + 51585, + 876, + 11, + 264, + 32309, + 51700 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.967, + "words": [ + { + "text": "Oh,", + "start": 114.64, + "end": 115.16, + "confidence": 0.912 + }, + { + "text": "the", + "start": 115.22, + "end": 115.44, + "confidence": 0.993 + }, + { + "text": "misery", + "start": 115.44, + "end": 116.2, + "confidence": 0.999 + } + ] + }, + { + "id": 11, + "seek": 9000, + "start": 116.84, + "end": 119.3, + "text": " Everybody wants to be my enemy", + "tokens": [ + 51700, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 51860 + ], + "temperature": 0.4, + "avg_logprob": -0.41540291383094397, + "compression_ratio": 1.5369458128078817, + "no_speech_prob": 0.7202673554420471, + "confidence": 0.944, + "words": [ + { + "text": "Everybody", + "start": 116.84, + "end": 117.6, + "confidence": 0.724 + }, + { + "text": "wants", + "start": 117.6, + "end": 117.96, + "confidence": 0.993 + }, + { + "text": "to", + "start": 117.96, + "end": 118.14, + "confidence": 0.998 + }, + { + "text": "be", + "start": 118.14, + "end": 118.26, + "confidence": 0.999 + }, + { + "text": "my", + "start": 118.26, + "end": 118.62, + "confidence": 0.997 + }, + { + "text": "enemy", + 
"start": 118.62, + "end": 119.3, + "confidence": 0.988 + } + ] + }, + { + "id": 12, + "seek": 11992, + "start": 119.96, + "end": 126.26, + "text": " I smell the sympathy Everybody wants to be my enemy", + "tokens": [ + 50364, + 286, + 4316, + 264, + 33240, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 50686 + ], + "temperature": 0.4, + "avg_logprob": -0.38010619236872745, + "compression_ratio": 1.755458515283843, + "no_speech_prob": 0.7215486168861389, + "confidence": 0.725, + "words": [ + { + "text": "I", + "start": 119.96, + "end": 120.78, + "confidence": 0.324 + }, + { + "text": "smell", + "start": 120.78, + "end": 121.42, + "confidence": 0.796 + }, + { + "text": "the", + "start": 121.42, + "end": 121.72, + "confidence": 0.857 + }, + { + "text": "sympathy", + "start": 121.72, + "end": 122.54, + "confidence": 0.981 + }, + { + "text": "Everybody", + "start": 122.54, + "end": 123.8, + "confidence": 0.265 + }, + { + "text": "wants", + "start": 123.8, + "end": 124.18, + "confidence": 0.984 + }, + { + "text": "to", + "start": 124.18, + "end": 124.48, + "confidence": 0.994 + }, + { + "text": "be", + "start": 124.48, + "end": 124.86, + "confidence": 0.994 + }, + { + "text": "my", + "start": 124.86, + "end": 125.58, + "confidence": 0.747 + }, + { + "text": "enemy", + "start": 125.58, + "end": 126.26, + "confidence": 0.967 + } + ] + }, + { + "id": 13, + "seek": 11992, + "start": 126.6, + "end": 132.52, + "text": " Look out for yourself My enemy", + "tokens": [ + 50686, + 2053, + 484, + 337, + 1803, + 1222, + 5945, + 50994 + ], + "temperature": 0.4, + "avg_logprob": -0.38010619236872745, + "compression_ratio": 1.755458515283843, + "no_speech_prob": 0.7215486168861389, + "confidence": 0.712, + "words": [ + { + "text": "Look", + "start": 126.6, + "end": 130.08, + "confidence": 0.463 + }, + { + "text": "out", + "start": 130.08, + "end": 130.26, + "confidence": 0.74 + }, + { + "text": "for", + "start": 130.26, + "end": 130.48, + "confidence": 0.993 + }, + { + "text": 
"yourself", + "start": 130.48, + "end": 130.98, + "confidence": 0.983 + }, + { + "text": "My", + "start": 130.98, + "end": 131.78, + "confidence": 0.399 + }, + { + "text": "enemy", + "start": 131.78, + "end": 132.52, + "confidence": 0.978 + } + ] + }, + { + "id": 14, + "seek": 11992, + "start": 133.92, + "end": 137.26, + "text": " Look out for yourself", + "tokens": [ + 50994, + 2053, + 484, + 337, + 1803, + 51230 + ], + "temperature": 0.4, + "avg_logprob": -0.38010619236872745, + "compression_ratio": 1.755458515283843, + "no_speech_prob": 0.7215486168861389, + "confidence": 0.977, + "words": [ + { + "text": "Look", + "start": 133.92, + "end": 134.06, + "confidence": 0.923 + }, + { + "text": "out", + "start": 134.06, + "end": 136.56, + "confidence": 0.989 + }, + { + "text": "for", + "start": 136.56, + "end": 136.74, + "confidence": 0.999 + }, + { + "text": "yourself", + "start": 136.74, + "end": 137.26, + "confidence": 0.999 + } + ] + }, + { + "id": 15, + "seek": 11992, + "start": 137.62, + "end": 140.18, + "text": " Look, okay, I'm Hoping that somebody pray for me", + "tokens": [ + 51230, + 2053, + 11, + 1392, + 11, + 286, + 478, + 13438, + 278, + 300, + 2618, + 3690, + 337, + 385, + 51374 + ], + "temperature": 0.4, + "avg_logprob": -0.38010619236872745, + "compression_ratio": 1.755458515283843, + "no_speech_prob": 0.7215486168861389, + "confidence": 0.779, + "words": [ + { + "text": "Look,", + "start": 137.62, + "end": 137.88, + "confidence": 0.774 + }, + { + "text": "okay,", + "start": 138.44, + "end": 138.58, + "confidence": 0.665 + }, + { + "text": "I'm", + "start": 138.76, + "end": 138.94, + "confidence": 0.965 + }, + { + "text": "Hoping", + "start": 138.94, + "end": 139.22, + "confidence": 0.414 + }, + { + "text": "that", + "start": 139.22, + "end": 139.34, + "confidence": 0.967 + }, + { + "text": "somebody", + "start": 139.34, + "end": 139.58, + "confidence": 0.985 + }, + { + "text": "pray", + "start": 139.58, + "end": 139.86, + "confidence": 0.855 + }, + { 
+ "text": "for", + "start": 139.86, + "end": 140.02, + "confidence": 0.959 + }, + { + "text": "me", + "start": 140.02, + "end": 140.18, + "confidence": 0.998 + } + ] + }, + { + "id": 16, + "seek": 11992, + "start": 140.36, + "end": 143.2, + "text": " I'm praying that somebody vote for me I'm staying where nobody's supposed to be", + "tokens": [ + 51374, + 286, + 478, + 15611, + 300, + 2618, + 4740, + 337, + 385, + 286, + 478, + 7939, + 689, + 5079, + 311, + 3442, + 281, + 312, + 51524 + ], + "temperature": 0.4, + "avg_logprob": -0.38010619236872745, + "compression_ratio": 1.755458515283843, + "no_speech_prob": 0.7215486168861389, + "confidence": 0.846, + "words": [ + { + "text": "I'm", + "start": 140.36, + "end": 140.48, + "confidence": 0.788 + }, + { + "text": "praying", + "start": 140.48, + "end": 140.64, + "confidence": 0.869 + }, + { + "text": "that", + "start": 140.64, + "end": 140.84, + "confidence": 0.97 + }, + { + "text": "somebody", + "start": 140.84, + "end": 141.1, + "confidence": 0.996 + }, + { + "text": "vote", + "start": 141.1, + "end": 141.34, + "confidence": 0.372 + }, + { + "text": "for", + "start": 141.34, + "end": 141.5, + "confidence": 0.999 + }, + { + "text": "me", + "start": 141.5, + "end": 141.7, + "confidence": 0.999 + }, + { + "text": "I'm", + "start": 141.7, + "end": 141.96, + "confidence": 0.902 + }, + { + "text": "staying", + "start": 141.96, + "end": 142.16, + "confidence": 0.696 + }, + { + "text": "where", + "start": 142.16, + "end": 142.34, + "confidence": 0.964 + }, + { + "text": "nobody's", + "start": 142.34, + "end": 142.68, + "confidence": 0.768 + }, + { + "text": "supposed", + "start": 142.68, + "end": 142.96, + "confidence": 0.97 + }, + { + "text": "to", + "start": 142.96, + "end": 143.1, + "confidence": 0.996 + }, + { + "text": "be", + "start": 143.1, + "end": 143.2, + "confidence": 0.975 + } + ] + }, + { + "id": 17, + "seek": 11992, + "start": 143.24, + "end": 146.29, + "text": " I propose to be in a wreck of emotions Ready to 
go whenever she let me know", + "tokens": [ + 51524, + 286, + 17421, + 281, + 312, + 294, + 257, + 21478, + 295, + 8462, + 9944, + 281, + 352, + 5699, + 750, + 718, + 385, + 458, + 51684 + ], + "temperature": 0.4, + "avg_logprob": -0.38010619236872745, + "compression_ratio": 1.755458515283843, + "no_speech_prob": 0.7215486168861389, + "confidence": 0.711, + "words": [ + { + "text": "I", + "start": 143.24, + "end": 143.4, + "confidence": 0.432 + }, + { + "text": "propose", + "start": 143.4, + "end": 143.72, + "confidence": 0.301 + }, + { + "text": "to", + "start": 143.72, + "end": 143.9, + "confidence": 0.838 + }, + { + "text": "be", + "start": 143.9, + "end": 144.04, + "confidence": 0.545 + }, + { + "text": "in", + "start": 144.04, + "end": 144.18, + "confidence": 0.741 + }, + { + "text": "a", + "start": 144.18, + "end": 144.3, + "confidence": 0.678 + }, + { + "text": "wreck", + "start": 144.3, + "end": 144.4, + "confidence": 0.392 + }, + { + "text": "of", + "start": 144.4, + "end": 144.54, + "confidence": 0.983 + }, + { + "text": "emotions", + "start": 144.54, + "end": 145.0, + "confidence": 0.916 + }, + { + "text": "Ready", + "start": 145.0, + "end": 145.3, + "confidence": 0.864 + }, + { + "text": "to", + "start": 145.3, + "end": 145.46, + "confidence": 0.994 + }, + { + "text": "go", + "start": 145.46, + "end": 145.6, + "confidence": 0.996 + }, + { + "text": "whenever", + "start": 145.6, + "end": 145.8, + "confidence": 0.844 + }, + { + "text": "she", + "start": 145.8, + "end": 145.96, + "confidence": 0.428 + }, + { + "text": "let", + "start": 145.96, + "end": 146.08, + "confidence": 0.954 + }, + { + "text": "me", + "start": 146.08, + "end": 146.16, + "confidence": 0.999 + }, + { + "text": "know", + "start": 146.16, + "end": 146.29, + "confidence": 0.977 + } + ] + }, + { + "id": 18, + "seek": 11992, + "start": 146.29, + "end": 149.78, + "text": " The road is long so put the pedal into the flow The enemy on my trail, my energy unavailable", + "tokens": [ + 51684, + 
440, + 3060, + 307, + 938, + 370, + 829, + 264, + 19122, + 666, + 264, + 3095, + 440, + 5945, + 322, + 452, + 9924, + 11, + 452, + 2281, + 36541, + 32699, + 51860 + ], + "temperature": 0.4, + "avg_logprob": -0.38010619236872745, + "compression_ratio": 1.755458515283843, + "no_speech_prob": 0.7215486168861389, + "confidence": 0.912, + "words": [ + { + "text": "The", + "start": 146.29, + "end": 146.52, + "confidence": 0.897 + }, + { + "text": "road", + "start": 146.52, + "end": 146.68, + "confidence": 0.986 + }, + { + "text": "is", + "start": 146.68, + "end": 146.78, + "confidence": 0.971 + }, + { + "text": "long", + "start": 146.78, + "end": 146.92, + "confidence": 0.913 + }, + { + "text": "so", + "start": 146.92, + "end": 147.04, + "confidence": 0.67 + }, + { + "text": "put", + "start": 147.04, + "end": 147.16, + "confidence": 0.954 + }, + { + "text": "the", + "start": 147.16, + "end": 147.28, + "confidence": 0.975 + }, + { + "text": "pedal", + "start": 147.28, + "end": 147.42, + "confidence": 0.924 + }, + { + "text": "into", + "start": 147.42, + "end": 147.6, + "confidence": 0.946 + }, + { + "text": "the", + "start": 147.6, + "end": 147.74, + "confidence": 0.992 + }, + { + "text": "flow", + "start": 147.74, + "end": 147.88, + "confidence": 0.844 + }, + { + "text": "The", + "start": 147.88, + "end": 148.08, + "confidence": 0.71 + }, + { + "text": "enemy", + "start": 148.08, + "end": 148.26, + "confidence": 0.887 + }, + { + "text": "on", + "start": 148.26, + "end": 148.38, + "confidence": 0.969 + }, + { + "text": "my", + "start": 148.38, + "end": 148.5, + "confidence": 0.982 + }, + { + "text": "trail,", + "start": 148.5, + "end": 148.64, + "confidence": 0.992 + }, + { + "text": "my", + "start": 148.72, + "end": 148.86, + "confidence": 0.99 + }, + { + "text": "energy", + "start": 148.86, + "end": 149.1, + "confidence": 0.992 + }, + { + "text": "unavailable", + "start": 149.1, + "end": 149.78, + "confidence": 0.875 + } + ] + }, + { + "id": 19, + "seek": 14984, + 
"start": 150.02, + "end": 151.18, + "text": " I'ma tell the master the way go", + "tokens": [ + 50364, + 286, + 478, + 64, + 980, + 264, + 4505, + 264, + 636, + 352, + 50436 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.592, + "words": [ + { + "text": "I'ma", + "start": 150.02, + "end": 150.24, + "confidence": 0.68 + }, + { + "text": "tell", + "start": 150.24, + "end": 150.36, + "confidence": 0.983 + }, + { + "text": "the", + "start": 150.36, + "end": 150.46, + "confidence": 0.248 + }, + { + "text": "master", + "start": 150.46, + "end": 150.68, + "confidence": 0.223 + }, + { + "text": "the", + "start": 150.68, + "end": 150.9, + "confidence": 0.783 + }, + { + "text": "way", + "start": 150.9, + "end": 151.0, + "confidence": 0.991 + }, + { + "text": "go", + "start": 151.0, + "end": 151.18, + "confidence": 0.673 + } + ] + }, + { + "id": 20, + "seek": 14984, + "start": 151.2, + "end": 152.54, + "text": " Hey, when I'm flat on my track to the top", + "tokens": [ + 50436, + 1911, + 11, + 562, + 286, + 478, + 4962, + 322, + 452, + 2837, + 281, + 264, + 1192, + 50500 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.589, + "words": [ + { + "text": "Hey,", + "start": 151.2, + "end": 151.4, + "confidence": 0.215 + }, + { + "text": "when", + "start": 151.46, + "end": 151.56, + "confidence": 0.811 + }, + { + "text": "I'm", + "start": 151.56, + "end": 151.72, + "confidence": 0.523 + }, + { + "text": "flat", + "start": 151.72, + "end": 151.8, + "confidence": 0.241 + }, + { + "text": "on", + "start": 151.8, + "end": 151.9, + "confidence": 0.636 + }, + { + "text": "my", + "start": 151.9, + "end": 152.02, + "confidence": 0.961 + }, + { + "text": "track", + "start": 152.02, + "end": 152.16, + "confidence": 0.482 + }, + { + "text": "to", + "start": 
152.16, + "end": 152.32, + "confidence": 0.874 + }, + { + "text": "the", + "start": 152.32, + "end": 152.42, + "confidence": 0.996 + }, + { + "text": "top", + "start": 152.42, + "end": 152.54, + "confidence": 0.998 + } + ] + }, + { + "id": 21, + "seek": 14984, + "start": 152.54, + "end": 154.34, + "text": " I been out of shape, thinking that I'm a box of an astronaut", + "tokens": [ + 50500, + 286, + 668, + 484, + 295, + 3909, + 11, + 1953, + 300, + 286, + 478, + 257, + 2424, + 295, + 364, + 18516, + 50592 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.725, + "words": [ + { + "text": "I", + "start": 152.54, + "end": 152.7, + "confidence": 0.988 + }, + { + "text": "been", + "start": 152.7, + "end": 152.76, + "confidence": 0.617 + }, + { + "text": "out", + "start": 152.76, + "end": 152.9, + "confidence": 0.679 + }, + { + "text": "of", + "start": 152.9, + "end": 153.02, + "confidence": 0.959 + }, + { + "text": "shape,", + "start": 153.02, + "end": 153.1, + "confidence": 0.999 + }, + { + "text": "thinking", + "start": 153.16, + "end": 153.32, + "confidence": 0.667 + }, + { + "text": "that", + "start": 153.32, + "end": 153.46, + "confidence": 0.261 + }, + { + "text": "I'm", + "start": 153.46, + "end": 153.62, + "confidence": 0.736 + }, + { + "text": "a", + "start": 153.62, + "end": 153.72, + "confidence": 0.725 + }, + { + "text": "box", + "start": 153.72, + "end": 153.76, + "confidence": 0.878 + }, + { + "text": "of", + "start": 153.76, + "end": 153.9, + "confidence": 0.483 + }, + { + "text": "an", + "start": 153.9, + "end": 154.04, + "confidence": 0.986 + }, + { + "text": "astronaut", + "start": 154.04, + "end": 154.34, + "confidence": 0.984 + } + ] + }, + { + "id": 22, + "seek": 14984, + "start": 154.5, + "end": 156.42, + "text": " Blasted off the planet, rocked the cars, catastrophic", + "tokens": [ + 50592, + 2177, + 34440, + 766, + 264, + 5054, + 
11, + 3727, + 292, + 264, + 5163, + 11, + 34915, + 50692 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.742, + "words": [ + { + "text": "Blasted", + "start": 154.5, + "end": 154.82, + "confidence": 0.817 + }, + { + "text": "off", + "start": 154.82, + "end": 155.02, + "confidence": 0.981 + }, + { + "text": "the", + "start": 155.02, + "end": 155.18, + "confidence": 0.95 + }, + { + "text": "planet,", + "start": 155.18, + "end": 155.36, + "confidence": 0.994 + }, + { + "text": "rocked", + "start": 155.44, + "end": 155.66, + "confidence": 0.691 + }, + { + "text": "the", + "start": 155.66, + "end": 155.74, + "confidence": 0.801 + }, + { + "text": "cars,", + "start": 155.74, + "end": 155.9, + "confidence": 0.308 + }, + { + "text": "catastrophic", + "start": 155.9, + "end": 156.42, + "confidence": 0.693 + } + ] + }, + { + "id": 23, + "seek": 14984, + "start": 156.44, + "end": 158.18, + "text": " And it matters more because I had it, now I had it", + "tokens": [ + 50692, + 400, + 309, + 7001, + 544, + 570, + 286, + 632, + 309, + 11, + 586, + 286, + 632, + 309, + 50777 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.787, + "words": [ + { + "text": "And", + "start": 156.44, + "end": 156.64, + "confidence": 0.858 + }, + { + "text": "it", + "start": 156.64, + "end": 156.78, + "confidence": 0.678 + }, + { + "text": "matters", + "start": 156.78, + "end": 156.96, + "confidence": 0.996 + }, + { + "text": "more", + "start": 156.96, + "end": 157.18, + "confidence": 0.981 + }, + { + "text": "because", + "start": 157.18, + "end": 157.42, + "confidence": 0.749 + }, + { + "text": "I", + "start": 157.42, + "end": 157.56, + "confidence": 0.703 + }, + { + "text": "had", + "start": 157.56, + "end": 157.66, + "confidence": 0.951 + }, + { + "text": "it,", + 
"start": 157.66, + "end": 157.8, + "confidence": 0.986 + }, + { + "text": "now", + "start": 157.8, + "end": 157.94, + "confidence": 0.56 + }, + { + "text": "I", + "start": 157.94, + "end": 158.06, + "confidence": 0.754 + }, + { + "text": "had", + "start": 158.06, + "end": 158.12, + "confidence": 0.937 + }, + { + "text": "it", + "start": 158.12, + "end": 158.18, + "confidence": 0.51 + } + ] + }, + { + "id": 24, + "seek": 14984, + "start": 158.18, + "end": 159.84, + "text": " I thought about wreaking havoc on an opposition", + "tokens": [ + 50777, + 286, + 1194, + 466, + 46674, + 2456, + 47367, + 322, + 364, + 13504, + 50864 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.959, + "words": [ + { + "text": "I", + "start": 158.18, + "end": 158.24, + "confidence": 0.915 + }, + { + "text": "thought", + "start": 158.24, + "end": 158.38, + "confidence": 0.982 + }, + { + "text": "about", + "start": 158.38, + "end": 158.58, + "confidence": 0.981 + }, + { + "text": "wreaking", + "start": 158.58, + "end": 158.86, + "confidence": 0.978 + }, + { + "text": "havoc", + "start": 158.86, + "end": 159.08, + "confidence": 1.0 + }, + { + "text": "on", + "start": 159.08, + "end": 159.3, + "confidence": 0.911 + }, + { + "text": "an", + "start": 159.3, + "end": 159.46, + "confidence": 0.909 + }, + { + "text": "opposition", + "start": 159.46, + "end": 159.84, + "confidence": 0.984 + } + ] + }, + { + "id": 25, + "seek": 14984, + "start": 159.86, + "end": 161.56, + "text": " Kinda shockin', they want it static, with precision", + "tokens": [ + 50864, + 35553, + 5588, + 259, + 6098, + 436, + 528, + 309, + 13437, + 11, + 365, + 18356, + 50952 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.572, + "words": [ + { + "text": "Kinda", + "start": 159.86, + "end": 
160.1, + "confidence": 0.654 + }, + { + "text": "shockin',", + "start": 160.1, + "end": 160.48, + "confidence": 0.381 + }, + { + "text": "they", + "start": 160.48, + "end": 160.6, + "confidence": 0.305 + }, + { + "text": "want", + "start": 160.6, + "end": 160.74, + "confidence": 0.57 + }, + { + "text": "it", + "start": 160.74, + "end": 160.88, + "confidence": 0.695 + }, + { + "text": "static,", + "start": 160.88, + "end": 161.02, + "confidence": 0.986 + }, + { + "text": "with", + "start": 161.14, + "end": 161.28, + "confidence": 0.733 + }, + { + "text": "precision", + "start": 161.28, + "end": 161.56, + "confidence": 0.794 + } + ] + }, + { + "id": 26, + "seek": 14984, + "start": 161.62, + "end": 163.36, + "text": " I'm automatic, quarterback, I ain't talkin' second", + "tokens": [ + 50952, + 286, + 478, + 12509, + 11, + 31952, + 11, + 286, + 7862, + 380, + 39243, + 6, + 1150, + 51043 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.812, + "words": [ + { + "text": "I'm", + "start": 161.62, + "end": 161.88, + "confidence": 0.963 + }, + { + "text": "automatic,", + "start": 161.88, + "end": 162.18, + "confidence": 0.961 + }, + { + "text": "quarterback,", + "start": 162.56, + "end": 162.58, + "confidence": 0.667 + }, + { + "text": "I", + "start": 162.66, + "end": 162.78, + "confidence": 0.727 + }, + { + "text": "ain't", + "start": 162.78, + "end": 162.9, + "confidence": 0.984 + }, + { + "text": "talkin'", + "start": 162.9, + "end": 163.2, + "confidence": 0.747 + }, + { + "text": "second", + "start": 163.2, + "end": 163.36, + "confidence": 0.536 + } + ] + }, + { + "id": 27, + "seek": 14984, + "start": 163.36, + "end": 165.2, + "text": " Pack it, pack it up, I don't panic, better batter up", + "tokens": [ + 51043, + 18466, + 309, + 11, + 2844, + 309, + 493, + 11, + 286, + 500, + 380, + 14783, + 11, + 1101, + 4220, + 493, + 51132 + ], + "temperature": 0.4, 
+ "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.789, + "words": [ + { + "text": "Pack", + "start": 163.36, + "end": 163.6, + "confidence": 0.939 + }, + { + "text": "it,", + "start": 163.6, + "end": 163.68, + "confidence": 0.893 + }, + { + "text": "pack", + "start": 163.7, + "end": 163.88, + "confidence": 0.962 + }, + { + "text": "it", + "start": 163.88, + "end": 164.02, + "confidence": 0.998 + }, + { + "text": "up,", + "start": 164.02, + "end": 164.12, + "confidence": 0.979 + }, + { + "text": "I", + "start": 164.12, + "end": 164.22, + "confidence": 0.974 + }, + { + "text": "don't", + "start": 164.22, + "end": 164.36, + "confidence": 0.888 + }, + { + "text": "panic,", + "start": 164.36, + "end": 164.56, + "confidence": 0.999 + }, + { + "text": "better", + "start": 164.62, + "end": 164.88, + "confidence": 0.568 + }, + { + "text": "batter", + "start": 164.88, + "end": 165.02, + "confidence": 0.176 + }, + { + "text": "up", + "start": 165.02, + "end": 165.2, + "confidence": 0.963 + } + ] + }, + { + "id": 28, + "seek": 14984, + "start": 165.2, + "end": 166.76, + "text": " Who the baddest, it don't matter cause we is your", + "tokens": [ + 51132, + 2102, + 264, + 1578, + 23748, + 11, + 309, + 500, + 380, + 1871, + 3082, + 321, + 307, + 428, + 51210 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.714, + "words": [ + { + "text": "Who", + "start": 165.2, + "end": 165.4, + "confidence": 0.994 + }, + { + "text": "the", + "start": 165.4, + "end": 165.54, + "confidence": 0.954 + }, + { + "text": "baddest,", + "start": 165.54, + "end": 165.78, + "confidence": 0.833 + }, + { + "text": "it", + "start": 165.8, + "end": 165.9, + "confidence": 0.993 + }, + { + "text": "don't", + "start": 165.9, + "end": 166.04, + "confidence": 0.995 + }, + { + "text": "matter", + "start": 
166.04, + "end": 166.18, + "confidence": 0.999 + }, + { + "text": "cause", + "start": 166.18, + "end": 166.38, + "confidence": 0.235 + }, + { + "text": "we", + "start": 166.38, + "end": 166.56, + "confidence": 0.956 + }, + { + "text": "is", + "start": 166.56, + "end": 166.64, + "confidence": 0.208 + }, + { + "text": "your", + "start": 166.64, + "end": 166.76, + "confidence": 0.577 + } + ] + }, + { + "id": 29, + "seek": 14984, + "start": 166.86, + "end": 169.82, + "text": " Everybody wants to be my enemy", + "tokens": [ + 51210, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 51402 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.976, + "words": [ + { + "text": "Everybody", + "start": 166.86, + "end": 167.44, + "confidence": 0.922 + }, + { + "text": "wants", + "start": 167.44, + "end": 167.82, + "confidence": 0.985 + }, + { + "text": "to", + "start": 167.82, + "end": 168.0, + "confidence": 0.998 + }, + { + "text": "be", + "start": 168.0, + "end": 168.16, + "confidence": 0.998 + }, + { + "text": "my", + "start": 168.16, + "end": 168.44, + "confidence": 0.993 + }, + { + "text": "enemy", + "start": 168.44, + "end": 169.82, + "confidence": 0.965 + } + ] + }, + { + "id": 30, + "seek": 14984, + "start": 170.62, + "end": 172.24, + "text": " Spare the sympathy", + "tokens": [ + 51402, + 1738, + 543, + 264, + 33240, + 51522 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.815, + "words": [ + { + "text": "Spare", + "start": 170.62, + "end": 171.28, + "confidence": 0.711 + }, + { + "text": "the", + "start": 171.28, + "end": 171.54, + "confidence": 0.974 + }, + { + "text": "sympathy", + "start": 171.54, + "end": 172.24, + "confidence": 0.896 + } + ] + }, + { + "id": 31, + "seek": 14984, + "start": 173.1, + "end": 176.24, + "text": " Everybody 
wants to be my enemy", + "tokens": [ + 51522, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 51720 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.984, + "words": [ + { + "text": "Everybody", + "start": 173.1, + "end": 173.7, + "confidence": 0.994 + }, + { + "text": "wants", + "start": 173.7, + "end": 174.06, + "confidence": 0.994 + }, + { + "text": "to", + "start": 174.06, + "end": 174.36, + "confidence": 0.999 + }, + { + "text": "be", + "start": 174.36, + "end": 174.72, + "confidence": 0.999 + }, + { + "text": "my", + "start": 174.72, + "end": 175.46, + "confidence": 0.923 + }, + { + "text": "enemy", + "start": 175.46, + "end": 176.24, + "confidence": 0.998 + } + ] + }, + { + "id": 32, + "seek": 14984, + "start": 176.86, + "end": 178.48, + "text": " Oh, the misery", + "tokens": [ + 51720, + 876, + 11, + 264, + 32309, + 51834 + ], + "temperature": 0.4, + "avg_logprob": -0.45425062569958424, + "compression_ratio": 1.7374631268436578, + "no_speech_prob": 0.7155851125717163, + "confidence": 0.879, + "words": [ + { + "text": "Oh,", + "start": 176.86, + "end": 177.5, + "confidence": 0.692 + }, + { + "text": "the", + "start": 177.56, + "end": 177.76, + "confidence": 0.984 + }, + { + "text": "misery", + "start": 177.76, + "end": 178.48, + "confidence": 0.999 + } + ] + }, + { + "id": 33, + "seek": 17924, + "start": 179.3, + "end": 181.62, + "text": " Everybody wants to be my enemy", + "tokens": [ + 50364, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 50514 + ], + "temperature": 0.4, + "avg_logprob": -0.35596295406943873, + "compression_ratio": 1.8440366972477065, + "no_speech_prob": 0.4185682237148285, + "confidence": 0.949, + "words": [ + { + "text": "Everybody", + "start": 179.3, + "end": 179.92, + "confidence": 0.776 + }, + { + "text": "wants", + "start": 179.92, + "end": 180.3, + "confidence": 0.98 + }, + { + "text": "to", + "start": 180.3, + "end": 
180.48, + "confidence": 0.997 + }, + { + "text": "be", + "start": 180.48, + "end": 180.62, + "confidence": 0.998 + }, + { + "text": "my", + "start": 180.62, + "end": 180.92, + "confidence": 0.992 + }, + { + "text": "enemy", + "start": 180.92, + "end": 181.62, + "confidence": 0.973 + } + ] + }, + { + "id": 34, + "seek": 17924, + "start": 183.08, + "end": 184.64, + "text": " Spell the sympathy", + "tokens": [ + 50514, + 3550, + 285, + 264, + 33240, + 50664 + ], + "temperature": 0.4, + "avg_logprob": -0.35596295406943873, + "compression_ratio": 1.8440366972477065, + "no_speech_prob": 0.4185682237148285, + "confidence": 0.56, + "words": [ + { + "text": "Spell", + "start": 183.08, + "end": 183.78, + "confidence": 0.345 + }, + { + "text": "the", + "start": 183.78, + "end": 184.08, + "confidence": 0.926 + }, + { + "text": "sympathy", + "start": 184.08, + "end": 184.64, + "confidence": 0.892 + } + ] + }, + { + "id": 35, + "seek": 17924, + "start": 185.5, + "end": 188.48, + "text": " Everybody wants to be my enemy", + "tokens": [ + 50664, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 50814 + ], + "temperature": 0.4, + "avg_logprob": -0.35596295406943873, + "compression_ratio": 1.8440366972477065, + "no_speech_prob": 0.4185682237148285, + "confidence": 0.961, + "words": [ + { + "text": "Everybody", + "start": 185.5, + "end": 186.16, + "confidence": 0.99 + }, + { + "text": "wants", + "start": 186.16, + "end": 186.52, + "confidence": 0.988 + }, + { + "text": "to", + "start": 186.52, + "end": 186.76, + "confidence": 0.999 + }, + { + "text": "be", + "start": 186.76, + "end": 187.28, + "confidence": 0.999 + }, + { + "text": "my", + "start": 187.28, + "end": 187.94, + "confidence": 0.811 + }, + { + "text": "enemy", + "start": 187.94, + "end": 188.48, + "confidence": 0.992 + } + ] + }, + { + "id": 36, + "seek": 17924, + "start": 188.9, + "end": 192.06, + "text": " Everywhere I swear I'll never be a saint", + "tokens": [ + 50814, + 37322, + 286, + 11902, + 286, + 603, + 1128, + 
312, + 257, + 28374, + 51014 + ], + "temperature": 0.4, + "avg_logprob": -0.35596295406943873, + "compression_ratio": 1.8440366972477065, + "no_speech_prob": 0.4185682237148285, + "confidence": 0.558, + "words": [ + { + "text": "Everywhere", + "start": 188.9, + "end": 189.58, + "confidence": 0.045 + }, + { + "text": "I", + "start": 189.58, + "end": 190.14, + "confidence": 0.402 + }, + { + "text": "swear", + "start": 190.14, + "end": 190.56, + "confidence": 0.99 + }, + { + "text": "I'll", + "start": 190.56, + "end": 190.96, + "confidence": 0.744 + }, + { + "text": "never", + "start": 190.96, + "end": 191.32, + "confidence": 0.996 + }, + { + "text": "be", + "start": 191.32, + "end": 191.68, + "confidence": 0.995 + }, + { + "text": "a", + "start": 191.68, + "end": 191.9, + "confidence": 0.61 + }, + { + "text": "saint", + "start": 191.9, + "end": 192.06, + "confidence": 0.87 + } + ] + }, + { + "id": 37, + "seek": 17924, + "start": 192.1, + "end": 194.78, + "text": " Nowhere my enemy", + "tokens": [ + 51014, + 823, + 6703, + 452, + 5945, + 51164 + ], + "temperature": 0.4, + "avg_logprob": -0.35596295406943873, + "compression_ratio": 1.8440366972477065, + "no_speech_prob": 0.4185682237148285, + "confidence": 0.679, + "words": [ + { + "text": "Nowhere", + "start": 192.1, + "end": 193.18, + "confidence": 0.658 + }, + { + "text": "my", + "start": 193.18, + "end": 194.08, + "confidence": 0.502 + }, + { + "text": "enemy", + "start": 194.08, + "end": 194.78, + "confidence": 0.979 + } + ] + }, + { + "id": 38, + "seek": 17924, + "start": 195.14, + "end": 198.36, + "text": " Everywhere I swear I'll never be a saint", + "tokens": [ + 51164, + 37322, + 286, + 11902, + 286, + 603, + 1128, + 312, + 257, + 28374, + 51314 + ], + "temperature": 0.4, + "avg_logprob": -0.35596295406943873, + "compression_ratio": 1.8440366972477065, + "no_speech_prob": 0.4185682237148285, + "confidence": 0.994, + "words": [ + { + "text": "Everywhere", + "start": 195.14, + "end": 196.06, + "confidence": 
0.973 + }, + { + "text": "I", + "start": 196.06, + "end": 196.5, + "confidence": 0.994 + }, + { + "text": "swear", + "start": 196.5, + "end": 196.78, + "confidence": 0.997 + }, + { + "text": "I'll", + "start": 196.78, + "end": 197.34, + "confidence": 0.995 + }, + { + "text": "never", + "start": 197.34, + "end": 197.56, + "confidence": 0.999 + }, + { + "text": "be", + "start": 197.56, + "end": 197.92, + "confidence": 0.999 + }, + { + "text": "a", + "start": 197.92, + "end": 198.12, + "confidence": 0.998 + }, + { + "text": "saint", + "start": 198.12, + "end": 198.36, + "confidence": 0.993 + } + ] + }, + { + "id": 39, + "seek": 17924, + "start": 198.5, + "end": 199.44, + "text": " Look out for yourself", + "tokens": [ + 51314, + 2053, + 484, + 337, + 1803, + 51414 + ], + "temperature": 0.4, + "avg_logprob": -0.35596295406943873, + "compression_ratio": 1.8440366972477065, + "no_speech_prob": 0.4185682237148285, + "confidence": 0.754, + "words": [ + { + "text": "Look", + "start": 198.5, + "end": 198.74, + "confidence": 0.356 + }, + { + "text": "out", + "start": 198.74, + "end": 198.92, + "confidence": 0.98 + }, + { + "text": "for", + "start": 198.92, + "end": 199.12, + "confidence": 0.97 + }, + { + "text": "yourself", + "start": 199.12, + "end": 199.44, + "confidence": 0.956 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/nocond_music.mp4.words.json b/tests/expected/corner_cases/nocond_music.mp4.words.json new file mode 100644 index 0000000000000000000000000000000000000000..9647c5b07f285b8445d88483e2c9bd612e3d7413 --- /dev/null +++ b/tests/expected/corner_cases/nocond_music.mp4.words.json @@ -0,0 +1,2750 @@ +{ + "text": " I Oh, the misery Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy Look out for yourself My enemy Look out for yourself But I'm ready Your words up on the wall as you're praying for my phone And the laughter in the holes and the names that I've been called I 
stack it in my mind and I'm waiting for the time When I show you what it's like to be worse but in the mind Tell you you're the greatest But once you turn they hate us Oh, the misery Everybody wants to be my enemy Spare the sympathy Everybody wants to be my enemy Look out for yourself My enemy Look out for yourself Look, okay I'm hoping that somebody pray for me I'm praying that somebody hold for me. I'm staying where nobody's supposed to be. I propose to be in a wreck of emotions. Ready to go whenever you let me know. The road is long, so put the pedal into the flow. The enemy on my trail, my energy unavailable. I'ma tell them I said away, go away. When I'm plotting, I'ma drive to the top. I've been out of shape, thinking out of the box. I'm an astronaut, blasted off the planet. Rock the cars, catastrophic, and it matters more because I had it now. Had I thought about wreaking havoc on an opposition. Kind of shocking, they want it static. With precision, I'm automatic. Quarterback, I ain't talking second. Pack it, pack it up. I don't panic, better, better. Up who the baddest. it don't matter cause we is your enemy. 
I swear I'll never be insane You gotta be insane", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 2.24, + "end": 2.36, + "text": " I", + "tokens": [ + 50364, + 286, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.9355003237724304, + "compression_ratio": 0.1111111111111111, + "no_speech_prob": 0.7811808586120605, + "confidence": 0.032, + "words": [ + { + "text": "I", + "start": 2.24, + "end": 2.36, + "confidence": 0.032 + } + ] + }, + { + "id": 1, + "seek": 6000, + "start": 60.0, + "end": 69.92, + "text": " Oh, the misery Everybody wants to be my enemy", + "tokens": [ + 50364, + 876, + 11, + 264, + 32309, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 50866 + ], + "temperature": 0.0, + "avg_logprob": -0.45629865472966974, + "compression_ratio": 1.62, + "no_speech_prob": 0.8699213266372681, + "confidence": 0.669, + "words": [ + { + "text": "Oh,", + "start": 60.0, + "end": 63.4, + "confidence": 0.084 + }, + { + "text": "the", + "start": 65.24, + "end": 65.5, + "confidence": 0.797 + }, + { + "text": "misery", + "start": 65.5, + "end": 66.3, + "confidence": 0.993 + }, + { + "text": "Everybody", + "start": 66.3, + "end": 67.7, + "confidence": 0.43 + }, + { + "text": "wants", + "start": 67.7, + "end": 68.08, + "confidence": 0.983 + }, + { + "text": "to", + "start": 68.08, + "end": 68.26, + "confidence": 0.993 + }, + { + "text": "be", + "start": 68.26, + "end": 68.44, + "confidence": 0.996 + }, + { + "text": "my", + "start": 68.44, + "end": 68.74, + "confidence": 0.983 + }, + { + "text": "enemy", + "start": 68.74, + "end": 69.92, + "confidence": 0.984 + } + ] + }, + { + "id": 2, + "seek": 6000, + "start": 70.88, + "end": 76.42, + "text": " Spare the sympathy Everybody wants to be my enemy", + "tokens": [ + 50866, + 1738, + 543, + 264, + 33240, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 51182 + ], + "temperature": 0.0, + "avg_logprob": -0.45629865472966974, + "compression_ratio": 1.62, + "no_speech_prob": 0.8699213266372681, + "confidence": 0.934, + 
"words": [ + { + "text": "Spare", + "start": 70.88, + "end": 71.54, + "confidence": 0.814 + }, + { + "text": "the", + "start": 71.54, + "end": 71.8, + "confidence": 0.968 + }, + { + "text": "sympathy", + "start": 71.8, + "end": 72.64, + "confidence": 0.993 + }, + { + "text": "Everybody", + "start": 72.64, + "end": 73.96, + "confidence": 0.963 + }, + { + "text": "wants", + "start": 73.96, + "end": 74.3, + "confidence": 0.994 + }, + { + "text": "to", + "start": 74.3, + "end": 74.64, + "confidence": 0.999 + }, + { + "text": "be", + "start": 74.64, + "end": 75.16, + "confidence": 0.999 + }, + { + "text": "my", + "start": 75.16, + "end": 75.72, + "confidence": 0.837 + }, + { + "text": "enemy", + "start": 75.72, + "end": 76.42, + "confidence": 0.997 + } + ] + }, + { + "id": 3, + "seek": 6000, + "start": 79.92, + "end": 82.68, + "text": " Look out for yourself My enemy", + "tokens": [ + 51182, + 2053, + 484, + 337, + 1803, + 1222, + 5945, + 51496 + ], + "temperature": 0.0, + "avg_logprob": -0.45629865472966974, + "compression_ratio": 1.62, + "no_speech_prob": 0.8699213266372681, + "confidence": 0.774, + "words": [ + { + "text": "Look", + "start": 79.92, + "end": 80.24, + "confidence": 0.43 + }, + { + "text": "out", + "start": 80.24, + "end": 80.46, + "confidence": 0.99 + }, + { + "text": "for", + "start": 80.46, + "end": 80.68, + "confidence": 0.989 + }, + { + "text": "yourself", + "start": 80.68, + "end": 81.14, + "confidence": 0.97 + }, + { + "text": "My", + "start": 81.14, + "end": 81.94, + "confidence": 0.536 + }, + { + "text": "enemy", + "start": 81.94, + "end": 82.68, + "confidence": 0.98 + } + ] + }, + { + "id": 4, + "seek": 6000, + "start": 86.14, + "end": 88.48, + "text": " Look out for yourself But I'm ready", + "tokens": [ + 51496, + 2053, + 484, + 337, + 1803, + 583, + 286, + 478, + 1919, + 51792 + ], + "temperature": 0.0, + "avg_logprob": -0.45629865472966974, + "compression_ratio": 1.62, + "no_speech_prob": 0.8699213266372681, + "confidence": 0.928, + 
"words": [ + { + "text": "Look", + "start": 86.14, + "end": 86.46, + "confidence": 0.748 + }, + { + "text": "out", + "start": 86.46, + "end": 86.68, + "confidence": 0.988 + }, + { + "text": "for", + "start": 86.68, + "end": 86.88, + "confidence": 0.998 + }, + { + "text": "yourself", + "start": 86.88, + "end": 87.56, + "confidence": 0.999 + }, + { + "text": "But", + "start": 87.56, + "end": 87.92, + "confidence": 0.766 + }, + { + "text": "I'm", + "start": 87.92, + "end": 88.14, + "confidence": 0.989 + }, + { + "text": "ready", + "start": 88.14, + "end": 88.48, + "confidence": 0.995 + } + ] + }, + { + "id": 5, + "seek": 8856, + "start": 88.64, + "end": 91.7, + "text": " Your words up on the wall as you're praying for my phone", + "tokens": [ + 50364, + 2260, + 2283, + 493, + 322, + 264, + 2929, + 382, + 291, + 434, + 15611, + 337, + 452, + 2593, + 50520 + ], + "temperature": 0.0, + "avg_logprob": -0.2874426958037586, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7892544865608215, + "confidence": 0.82, + "words": [ + { + "text": "Your", + "start": 88.64, + "end": 88.86, + "confidence": 0.548 + }, + { + "text": "words", + "start": 88.86, + "end": 89.18, + "confidence": 0.92 + }, + { + "text": "up", + "start": 89.18, + "end": 89.48, + "confidence": 0.964 + }, + { + "text": "on", + "start": 89.48, + "end": 89.62, + "confidence": 0.995 + }, + { + "text": "the", + "start": 89.62, + "end": 89.78, + "confidence": 0.991 + }, + { + "text": "wall", + "start": 89.78, + "end": 90.14, + "confidence": 0.88 + }, + { + "text": "as", + "start": 90.14, + "end": 90.32, + "confidence": 0.402 + }, + { + "text": "you're", + "start": 90.32, + "end": 90.46, + "confidence": 0.828 + }, + { + "text": "praying", + "start": 90.46, + "end": 90.86, + "confidence": 0.967 + }, + { + "text": "for", + "start": 90.86, + "end": 91.1, + "confidence": 0.97 + }, + { + "text": "my", + "start": 91.1, + "end": 91.28, + "confidence": 0.989 + }, + { + "text": "phone", + "start": 91.28, + 
"end": 91.7, + "confidence": 0.702 + } + ] + }, + { + "id": 6, + "seek": 8856, + "start": 91.78, + "end": 94.74, + "text": " And the laughter in the holes and the names that I've been called", + "tokens": [ + 50520, + 400, + 264, + 13092, + 294, + 264, + 8118, + 293, + 264, + 5288, + 300, + 286, + 600, + 668, + 1219, + 50680 + ], + "temperature": 0.0, + "avg_logprob": -0.2874426958037586, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7892544865608215, + "confidence": 0.884, + "words": [ + { + "text": "And", + "start": 91.78, + "end": 91.94, + "confidence": 0.844 + }, + { + "text": "the", + "start": 91.94, + "end": 92.12, + "confidence": 0.987 + }, + { + "text": "laughter", + "start": 92.12, + "end": 92.5, + "confidence": 0.994 + }, + { + "text": "in", + "start": 92.5, + "end": 92.72, + "confidence": 0.85 + }, + { + "text": "the", + "start": 92.72, + "end": 92.92, + "confidence": 0.997 + }, + { + "text": "holes", + "start": 92.92, + "end": 93.28, + "confidence": 0.607 + }, + { + "text": "and", + "start": 93.28, + "end": 93.48, + "confidence": 0.595 + }, + { + "text": "the", + "start": 93.48, + "end": 93.6, + "confidence": 0.991 + }, + { + "text": "names", + "start": 93.6, + "end": 93.84, + "confidence": 0.991 + }, + { + "text": "that", + "start": 93.84, + "end": 94.14, + "confidence": 0.957 + }, + { + "text": "I've", + "start": 94.14, + "end": 94.34, + "confidence": 0.914 + }, + { + "text": "been", + "start": 94.34, + "end": 94.46, + "confidence": 0.985 + }, + { + "text": "called", + "start": 94.46, + "end": 94.74, + "confidence": 0.912 + } + ] + }, + { + "id": 7, + "seek": 8856, + "start": 95.0, + "end": 97.82, + "text": " I stack it in my mind and I'm waiting for the time", + "tokens": [ + 50680, + 286, + 8630, + 309, + 294, + 452, + 1575, + 293, + 286, + 478, + 3806, + 337, + 264, + 565, + 50832 + ], + "temperature": 0.0, + "avg_logprob": -0.2874426958037586, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7892544865608215, + 
"confidence": 0.959, + "words": [ + { + "text": "I", + "start": 95.0, + "end": 95.14, + "confidence": 0.987 + }, + { + "text": "stack", + "start": 95.14, + "end": 95.46, + "confidence": 0.825 + }, + { + "text": "it", + "start": 95.46, + "end": 95.72, + "confidence": 0.995 + }, + { + "text": "in", + "start": 95.72, + "end": 95.8, + "confidence": 0.996 + }, + { + "text": "my", + "start": 95.8, + "end": 96.1, + "confidence": 0.994 + }, + { + "text": "mind", + "start": 96.1, + "end": 96.4, + "confidence": 0.999 + }, + { + "text": "and", + "start": 96.4, + "end": 96.6, + "confidence": 0.759 + }, + { + "text": "I'm", + "start": 96.6, + "end": 96.72, + "confidence": 0.991 + }, + { + "text": "waiting", + "start": 96.72, + "end": 97.14, + "confidence": 0.988 + }, + { + "text": "for", + "start": 97.14, + "end": 97.36, + "confidence": 0.996 + }, + { + "text": "the", + "start": 97.36, + "end": 97.54, + "confidence": 0.996 + }, + { + "text": "time", + "start": 97.54, + "end": 97.82, + "confidence": 0.996 + } + ] + }, + { + "id": 8, + "seek": 8856, + "start": 97.98, + "end": 101.26, + "text": " When I show you what it's like to be worse but in the mind", + "tokens": [ + 50832, + 1133, + 286, + 855, + 291, + 437, + 309, + 311, + 411, + 281, + 312, + 5324, + 457, + 294, + 264, + 1575, + 51000 + ], + "temperature": 0.0, + "avg_logprob": -0.2874426958037586, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7892544865608215, + "confidence": 0.756, + "words": [ + { + "text": "When", + "start": 97.98, + "end": 98.14, + "confidence": 0.922 + }, + { + "text": "I", + "start": 98.14, + "end": 98.32, + "confidence": 0.993 + }, + { + "text": "show", + "start": 98.32, + "end": 98.5, + "confidence": 0.958 + }, + { + "text": "you", + "start": 98.5, + "end": 98.76, + "confidence": 0.994 + }, + { + "text": "what", + "start": 98.76, + "end": 98.94, + "confidence": 0.996 + }, + { + "text": "it's", + "start": 98.94, + "end": 99.24, + "confidence": 0.988 + }, + { + "text": "like", + 
"start": 99.24, + "end": 99.46, + "confidence": 0.998 + }, + { + "text": "to", + "start": 99.46, + "end": 99.7, + "confidence": 0.875 + }, + { + "text": "be", + "start": 99.7, + "end": 99.84, + "confidence": 0.997 + }, + { + "text": "worse", + "start": 99.84, + "end": 100.08, + "confidence": 0.445 + }, + { + "text": "but", + "start": 100.08, + "end": 100.4, + "confidence": 0.199 + }, + { + "text": "in", + "start": 100.4, + "end": 100.58, + "confidence": 0.863 + }, + { + "text": "the", + "start": 100.58, + "end": 100.8, + "confidence": 0.428 + }, + { + "text": "mind", + "start": 100.8, + "end": 101.26, + "confidence": 0.622 + } + ] + }, + { + "id": 9, + "seek": 8856, + "start": 101.34, + "end": 106.84, + "text": " Tell you you're the greatest", + "tokens": [ + 51000, + 5115, + 291, + 291, + 434, + 264, + 6636, + 51292 + ], + "temperature": 0.0, + "avg_logprob": -0.2874426958037586, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7892544865608215, + "confidence": 0.94, + "words": [ + { + "text": "Tell", + "start": 101.34, + "end": 102.22, + "confidence": 0.937 + }, + { + "text": "you", + "start": 102.22, + "end": 102.96, + "confidence": 0.993 + }, + { + "text": "you're", + "start": 102.96, + "end": 103.94, + "confidence": 0.873 + }, + { + "text": "the", + "start": 103.94, + "end": 104.36, + "confidence": 0.985 + }, + { + "text": "greatest", + "start": 104.36, + "end": 106.84, + "confidence": 0.986 + } + ] + }, + { + "id": 10, + "seek": 8856, + "start": 107.2, + "end": 113.02, + "text": " But once you turn they hate us", + "tokens": [ + 51292, + 583, + 1564, + 291, + 1261, + 436, + 4700, + 505, + 51592 + ], + "temperature": 0.0, + "avg_logprob": -0.2874426958037586, + "compression_ratio": 1.5869565217391304, + "no_speech_prob": 0.7892544865608215, + "confidence": 0.909, + "words": [ + { + "text": "But", + "start": 107.2, + "end": 107.62, + "confidence": 0.963 + }, + { + "text": "once", + "start": 107.62, + "end": 108.42, + "confidence": 0.786 + }, + { 
+ "text": "you", + "start": 108.42, + "end": 109.28, + "confidence": 0.998 + }, + { + "text": "turn", + "start": 109.28, + "end": 109.86, + "confidence": 0.914 + }, + { + "text": "they", + "start": 109.86, + "end": 110.38, + "confidence": 0.754 + }, + { + "text": "hate", + "start": 110.38, + "end": 111.92, + "confidence": 0.984 + }, + { + "text": "us", + "start": 111.92, + "end": 113.02, + "confidence": 0.999 + } + ] + }, + { + "id": 11, + "seek": 11312, + "start": 113.38, + "end": 119.78, + "text": " Oh, the misery Everybody wants to be my enemy", + "tokens": [ + 50364, + 876, + 11, + 264, + 32309, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.27150371839415355, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.865480363368988, + "confidence": 0.804, + "words": [ + { + "text": "Oh,", + "start": 113.38, + "end": 114.98, + "confidence": 0.317 + }, + { + "text": "the", + "start": 115.02, + "end": 115.42, + "confidence": 0.964 + }, + { + "text": "misery", + "start": 115.42, + "end": 116.26, + "confidence": 0.995 + }, + { + "text": "Everybody", + "start": 116.26, + "end": 117.58, + "confidence": 0.482 + }, + { + "text": "wants", + "start": 117.58, + "end": 117.96, + "confidence": 0.986 + }, + { + "text": "to", + "start": 117.96, + "end": 118.14, + "confidence": 0.996 + }, + { + "text": "be", + "start": 118.14, + "end": 118.32, + "confidence": 0.998 + }, + { + "text": "my", + "start": 118.32, + "end": 118.56, + "confidence": 0.993 + }, + { + "text": "enemy", + "start": 118.56, + "end": 119.78, + "confidence": 0.983 + } + ] + }, + { + "id": 12, + "seek": 11312, + "start": 120.7, + "end": 126.28, + "text": " Spare the sympathy Everybody wants to be my enemy", + "tokens": [ + 50714, + 1738, + 543, + 264, + 33240, + 7646, + 2738, + 281, + 312, + 452, + 5945, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.27150371839415355, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 
0.865480363368988, + "confidence": 0.874, + "words": [ + { + "text": "Spare", + "start": 120.7, + "end": 121.4, + "confidence": 0.576 + }, + { + "text": "the", + "start": 121.4, + "end": 121.7, + "confidence": 0.985 + }, + { + "text": "sympathy", + "start": 121.7, + "end": 122.5, + "confidence": 0.994 + }, + { + "text": "Everybody", + "start": 122.5, + "end": 123.84, + "confidence": 0.969 + }, + { + "text": "wants", + "start": 123.84, + "end": 124.18, + "confidence": 0.994 + }, + { + "text": "to", + "start": 124.18, + "end": 124.42, + "confidence": 0.999 + }, + { + "text": "be", + "start": 124.42, + "end": 125.24, + "confidence": 0.999 + }, + { + "text": "my", + "start": 125.24, + "end": 125.62, + "confidence": 0.836 + }, + { + "text": "enemy", + "start": 125.62, + "end": 126.28, + "confidence": 0.998 + } + ] + }, + { + "id": 13, + "seek": 11312, + "start": 126.62, + "end": 132.44, + "text": " Look out for yourself My enemy", + "tokens": [ + 51014, + 2053, + 484, + 337, + 1803, + 1222, + 5945, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.27150371839415355, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.865480363368988, + "confidence": 0.794, + "words": [ + { + "text": "Look", + "start": 126.62, + "end": 130.12, + "confidence": 0.593 + }, + { + "text": "out", + "start": 130.12, + "end": 130.32, + "confidence": 0.893 + }, + { + "text": "for", + "start": 130.32, + "end": 130.48, + "confidence": 0.978 + }, + { + "text": "yourself", + "start": 130.48, + "end": 130.94, + "confidence": 0.988 + }, + { + "text": "My", + "start": 130.94, + "end": 131.78, + "confidence": 0.496 + }, + { + "text": "enemy", + "start": 131.78, + "end": 132.44, + "confidence": 0.989 + } + ] + }, + { + "id": 14, + "seek": 11312, + "start": 133.72, + "end": 137.14, + "text": " Look out for yourself", + "tokens": [ + 51314, + 2053, + 484, + 337, + 1803, + 51564 + ], + "temperature": 0.0, + "avg_logprob": -0.27150371839415355, + "compression_ratio": 1.6610169491525424, + 
"no_speech_prob": 0.865480363368988, + "confidence": 0.97, + "words": [ + { + "text": "Look", + "start": 133.72, + "end": 134.66, + "confidence": 0.906 + }, + { + "text": "out", + "start": 134.66, + "end": 136.54, + "confidence": 0.978 + }, + { + "text": "for", + "start": 136.54, + "end": 136.74, + "confidence": 0.999 + }, + { + "text": "yourself", + "start": 136.74, + "end": 137.14, + "confidence": 0.999 + } + ] + }, + { + "id": 15, + "seek": 11312, + "start": 137.6, + "end": 140.24, + "text": " Look, okay I'm hoping that somebody pray for me", + "tokens": [ + 51564, + 2053, + 11, + 1392, + 286, + 478, + 7159, + 300, + 2618, + 3690, + 337, + 385, + 51714 + ], + "temperature": 0.0, + "avg_logprob": -0.27150371839415355, + "compression_ratio": 1.6610169491525424, + "no_speech_prob": 0.865480363368988, + "confidence": 0.786, + "words": [ + { + "text": "Look,", + "start": 137.6, + "end": 137.88, + "confidence": 0.728 + }, + { + "text": "okay", + "start": 138.4, + "end": 138.6, + "confidence": 0.728 + }, + { + "text": "I'm", + "start": 138.6, + "end": 138.94, + "confidence": 0.699 + }, + { + "text": "hoping", + "start": 138.94, + "end": 139.16, + "confidence": 0.502 + }, + { + "text": "that", + "start": 139.16, + "end": 139.34, + "confidence": 0.959 + }, + { + "text": "somebody", + "start": 139.34, + "end": 139.58, + "confidence": 0.981 + }, + { + "text": "pray", + "start": 139.58, + "end": 139.84, + "confidence": 0.821 + }, + { + "text": "for", + "start": 139.84, + "end": 140.02, + "confidence": 0.901 + }, + { + "text": "me", + "start": 140.02, + "end": 140.24, + "confidence": 0.999 + } + ] + }, + { + "id": 16, + "seek": 14012, + "start": 140.34, + "end": 141.7, + "text": " I'm praying that somebody hold for me.", + "tokens": [ + 50364, + 286, + 478, + 15611, + 300, + 2618, + 1797, + 337, + 385, + 13, + 50439 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + 
"confidence": 0.794, + "words": [ + { + "text": "I'm", + "start": 140.34, + "end": 140.44, + "confidence": 0.819 + }, + { + "text": "praying", + "start": 140.44, + "end": 140.66, + "confidence": 0.694 + }, + { + "text": "that", + "start": 140.66, + "end": 140.84, + "confidence": 0.787 + }, + { + "text": "somebody", + "start": 140.84, + "end": 141.1, + "confidence": 0.985 + }, + { + "text": "hold", + "start": 141.1, + "end": 141.36, + "confidence": 0.442 + }, + { + "text": "for", + "start": 141.36, + "end": 141.52, + "confidence": 0.992 + }, + { + "text": "me.", + "start": 141.52, + "end": 141.7, + "confidence": 0.999 + } + ] + }, + { + "id": 17, + "seek": 14012, + "start": 141.76, + "end": 143.2, + "text": " I'm staying where nobody's supposed to be.", + "tokens": [ + 50439, + 286, + 478, + 7939, + 689, + 5079, + 311, + 3442, + 281, + 312, + 13, + 50516 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.853, + "words": [ + { + "text": "I'm", + "start": 141.76, + "end": 141.98, + "confidence": 0.976 + }, + { + "text": "staying", + "start": 141.98, + "end": 142.16, + "confidence": 0.708 + }, + { + "text": "where", + "start": 142.16, + "end": 142.34, + "confidence": 0.906 + }, + { + "text": "nobody's", + "start": 142.34, + "end": 142.68, + "confidence": 0.655 + }, + { + "text": "supposed", + "start": 142.68, + "end": 142.94, + "confidence": 0.923 + }, + { + "text": "to", + "start": 142.94, + "end": 143.1, + "confidence": 0.992 + }, + { + "text": "be.", + "start": 143.1, + "end": 143.2, + "confidence": 0.997 + } + ] + }, + { + "id": 18, + "seek": 14012, + "start": 143.24, + "end": 144.98, + "text": " I propose to be in a wreck of emotions.", + "tokens": [ + 50516, + 286, + 17421, + 281, + 312, + 294, + 257, + 21478, + 295, + 8462, + 13, + 50610 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + 
"no_speech_prob": 0.7754144668579102, + "confidence": 0.646, + "words": [ + { + "text": "I", + "start": 143.24, + "end": 143.42, + "confidence": 0.492 + }, + { + "text": "propose", + "start": 143.42, + "end": 143.72, + "confidence": 0.333 + }, + { + "text": "to", + "start": 143.72, + "end": 143.88, + "confidence": 0.778 + }, + { + "text": "be", + "start": 143.88, + "end": 144.02, + "confidence": 0.442 + }, + { + "text": "in", + "start": 144.02, + "end": 144.18, + "confidence": 0.812 + }, + { + "text": "a", + "start": 144.18, + "end": 144.28, + "confidence": 0.559 + }, + { + "text": "wreck", + "start": 144.28, + "end": 144.4, + "confidence": 0.811 + }, + { + "text": "of", + "start": 144.4, + "end": 144.54, + "confidence": 0.99 + }, + { + "text": "emotions.", + "start": 144.54, + "end": 144.98, + "confidence": 0.953 + } + ] + }, + { + "id": 19, + "seek": 14012, + "start": 145.06, + "end": 146.3, + "text": " Ready to go whenever you let me know.", + "tokens": [ + 50610, + 9944, + 281, + 352, + 5699, + 291, + 718, + 385, + 458, + 13, + 50672 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.834, + "words": [ + { + "text": "Ready", + "start": 145.06, + "end": 145.3, + "confidence": 0.951 + }, + { + "text": "to", + "start": 145.3, + "end": 145.46, + "confidence": 0.997 + }, + { + "text": "go", + "start": 145.46, + "end": 145.6, + "confidence": 0.997 + }, + { + "text": "whenever", + "start": 145.6, + "end": 145.78, + "confidence": 0.661 + }, + { + "text": "you", + "start": 145.78, + "end": 145.94, + "confidence": 0.403 + }, + { + "text": "let", + "start": 145.94, + "end": 146.08, + "confidence": 0.952 + }, + { + "text": "me", + "start": 146.08, + "end": 146.18, + "confidence": 0.998 + }, + { + "text": "know.", + "start": 146.18, + "end": 146.3, + "confidence": 0.977 + } + ] + }, + { + "id": 20, + "seek": 14012, + "start": 146.36, + "end": 147.88, + "text": 
" The road is long, so put the pedal into the flow.", + "tokens": [ + 50672, + 440, + 3060, + 307, + 938, + 11, + 370, + 829, + 264, + 19122, + 666, + 264, + 3095, + 13, + 50749 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.959, + "words": [ + { + "text": "The", + "start": 146.36, + "end": 146.52, + "confidence": 0.99 + }, + { + "text": "road", + "start": 146.52, + "end": 146.68, + "confidence": 0.99 + }, + { + "text": "is", + "start": 146.68, + "end": 146.78, + "confidence": 0.987 + }, + { + "text": "long,", + "start": 146.78, + "end": 146.9, + "confidence": 0.961 + }, + { + "text": "so", + "start": 146.92, + "end": 147.02, + "confidence": 0.968 + }, + { + "text": "put", + "start": 147.02, + "end": 147.16, + "confidence": 0.954 + }, + { + "text": "the", + "start": 147.16, + "end": 147.28, + "confidence": 0.972 + }, + { + "text": "pedal", + "start": 147.28, + "end": 147.4, + "confidence": 0.993 + }, + { + "text": "into", + "start": 147.4, + "end": 147.6, + "confidence": 0.9 + }, + { + "text": "the", + "start": 147.6, + "end": 147.76, + "confidence": 0.992 + }, + { + "text": "flow.", + "start": 147.76, + "end": 147.88, + "confidence": 0.856 + } + ] + }, + { + "id": 21, + "seek": 14012, + "start": 147.94, + "end": 149.78, + "text": " The enemy on my trail, my energy unavailable.", + "tokens": [ + 50749, + 440, + 5945, + 322, + 452, + 9924, + 11, + 452, + 2281, + 36541, + 32699, + 13, + 50856 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.948, + "words": [ + { + "text": "The", + "start": 147.94, + "end": 148.08, + "confidence": 0.968 + }, + { + "text": "enemy", + "start": 148.08, + "end": 148.26, + "confidence": 0.726 + }, + { + "text": "on", + "start": 148.26, + "end": 148.38, + "confidence": 0.974 + }, + { + "text": "my", + 
"start": 148.38, + "end": 148.5, + "confidence": 0.974 + }, + { + "text": "trail,", + "start": 148.5, + "end": 148.64, + "confidence": 0.986 + }, + { + "text": "my", + "start": 148.68, + "end": 148.86, + "confidence": 0.99 + }, + { + "text": "energy", + "start": 148.86, + "end": 149.1, + "confidence": 0.996 + }, + { + "text": "unavailable.", + "start": 149.1, + "end": 149.78, + "confidence": 0.978 + } + ] + }, + { + "id": 22, + "seek": 14012, + "start": 150.0, + "end": 151.35, + "text": " I'ma tell them I said away, go away.", + "tokens": [ + 50856, + 286, + 478, + 64, + 980, + 552, + 286, + 848, + 1314, + 11, + 352, + 1314, + 13, + 50924 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.571, + "words": [ + { + "text": "I'ma", + "start": 150.0, + "end": 150.26, + "confidence": 0.765 + }, + { + "text": "tell", + "start": 150.26, + "end": 150.36, + "confidence": 0.989 + }, + { + "text": "them", + "start": 150.36, + "end": 150.5, + "confidence": 0.335 + }, + { + "text": "I", + "start": 150.5, + "end": 150.62, + "confidence": 0.359 + }, + { + "text": "said", + "start": 150.62, + "end": 150.76, + "confidence": 0.3 + }, + { + "text": "away,", + "start": 150.76, + "end": 151.0, + "confidence": 0.325 + }, + { + "text": "go", + "start": 151.14, + "end": 151.18, + "confidence": 0.911 + }, + { + "text": "away.", + "start": 151.18, + "end": 151.35, + "confidence": 0.781 + } + ] + }, + { + "id": 23, + "seek": 14012, + "start": 151.35, + "end": 152.55, + "text": " When I'm plotting, I'ma drive to the top.", + "tokens": [ + 50924, + 1133, + 286, + 478, + 41178, + 11, + 286, + 478, + 64, + 3332, + 281, + 264, + 1192, + 13, + 50985 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.644, + "words": [ + { + "text": "When", + "start": 151.35, + "end": 
151.56, + "confidence": 0.886 + }, + { + "text": "I'm", + "start": 151.56, + "end": 151.72, + "confidence": 0.592 + }, + { + "text": "plotting,", + "start": 151.72, + "end": 151.82, + "confidence": 0.365 + }, + { + "text": "I'ma", + "start": 151.84, + "end": 152.0, + "confidence": 0.487 + }, + { + "text": "drive", + "start": 152.0, + "end": 152.16, + "confidence": 0.622 + }, + { + "text": "to", + "start": 152.16, + "end": 152.3, + "confidence": 0.984 + }, + { + "text": "the", + "start": 152.3, + "end": 152.42, + "confidence": 0.997 + }, + { + "text": "top.", + "start": 152.42, + "end": 152.55, + "confidence": 0.999 + } + ] + }, + { + "id": 24, + "seek": 14012, + "start": 152.55, + "end": 153.74, + "text": " I've been out of shape, thinking out of the box.", + "tokens": [ + 50985, + 286, + 600, + 668, + 484, + 295, + 3909, + 11, + 1953, + 484, + 295, + 264, + 2424, + 13, + 51043 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.769, + "words": [ + { + "text": "I've", + "start": 152.55, + "end": 152.7, + "confidence": 0.723 + }, + { + "text": "been", + "start": 152.7, + "end": 152.78, + "confidence": 0.998 + }, + { + "text": "out", + "start": 152.78, + "end": 152.9, + "confidence": 0.905 + }, + { + "text": "of", + "start": 152.9, + "end": 153.02, + "confidence": 0.986 + }, + { + "text": "shape,", + "start": 153.02, + "end": 153.1, + "confidence": 0.998 + }, + { + "text": "thinking", + "start": 153.26, + "end": 153.32, + "confidence": 0.842 + }, + { + "text": "out", + "start": 153.32, + "end": 153.46, + "confidence": 0.343 + }, + { + "text": "of", + "start": 153.46, + "end": 153.56, + "confidence": 0.505 + }, + { + "text": "the", + "start": 153.56, + "end": 153.62, + "confidence": 0.82 + }, + { + "text": "box.", + "start": 153.62, + "end": 153.74, + "confidence": 0.998 + } + ] + }, + { + "id": 25, + "seek": 14012, + "start": 153.74, + "end": 155.34, + 
"text": " I'm an astronaut, blasted off the planet.", + "tokens": [ + 51043, + 286, + 478, + 364, + 18516, + 11, + 12035, + 292, + 766, + 264, + 5054, + 13, + 51124 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.967, + "words": [ + { + "text": "I'm", + "start": 153.74, + "end": 153.92, + "confidence": 0.996 + }, + { + "text": "an", + "start": 153.92, + "end": 154.06, + "confidence": 0.996 + }, + { + "text": "astronaut,", + "start": 154.06, + "end": 154.4, + "confidence": 0.991 + }, + { + "text": "blasted", + "start": 154.54, + "end": 154.88, + "confidence": 0.895 + }, + { + "text": "off", + "start": 154.88, + "end": 155.02, + "confidence": 0.987 + }, + { + "text": "the", + "start": 155.02, + "end": 155.18, + "confidence": 0.959 + }, + { + "text": "planet.", + "start": 155.18, + "end": 155.34, + "confidence": 0.997 + } + ] + }, + { + "id": 26, + "seek": 14012, + "start": 155.4, + "end": 157.18, + "text": " Rock the cars, catastrophic, and it matters more", + "tokens": [ + 51124, + 6922, + 264, + 5163, + 11, + 34915, + 11, + 293, + 309, + 7001, + 544, + 51212 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.703, + "words": [ + { + "text": "Rock", + "start": 155.4, + "end": 155.6, + "confidence": 0.564 + }, + { + "text": "the", + "start": 155.6, + "end": 155.74, + "confidence": 0.505 + }, + { + "text": "cars,", + "start": 155.74, + "end": 155.88, + "confidence": 0.47 + }, + { + "text": "catastrophic,", + "start": 155.9, + "end": 156.4, + "confidence": 0.771 + }, + { + "text": "and", + "start": 156.46, + "end": 156.62, + "confidence": 0.925 + }, + { + "text": "it", + "start": 156.62, + "end": 156.76, + "confidence": 0.733 + }, + { + "text": "matters", + "start": 156.76, + "end": 156.94, + "confidence": 0.878 + }, + { + "text": "more", 
+ "start": 156.94, + "end": 157.18, + "confidence": 0.974 + } + ] + }, + { + "id": 27, + "seek": 14012, + "start": 157.18, + "end": 157.91, + "text": " because I had it now.", + "tokens": [ + 51212, + 570, + 286, + 632, + 309, + 586, + 13, + 51254 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.649, + "words": [ + { + "text": "because", + "start": 157.18, + "end": 157.42, + "confidence": 0.99 + }, + { + "text": "I", + "start": 157.42, + "end": 157.56, + "confidence": 0.532 + }, + { + "text": "had", + "start": 157.56, + "end": 157.66, + "confidence": 0.936 + }, + { + "text": "it", + "start": 157.66, + "end": 157.82, + "confidence": 0.984 + }, + { + "text": "now.", + "start": 157.82, + "end": 157.91, + "confidence": 0.237 + } + ] + }, + { + "id": 28, + "seek": 14012, + "start": 157.91, + "end": 159.84, + "text": " Had I thought about wreaking havoc on an opposition.", + "tokens": [ + 51254, + 12298, + 286, + 1194, + 466, + 46674, + 2456, + 47367, + 322, + 364, + 13504, + 13, + 51350 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.954, + "words": [ + { + "text": "Had", + "start": 157.91, + "end": 158.12, + "confidence": 0.843 + }, + { + "text": "I", + "start": 158.12, + "end": 158.2, + "confidence": 0.971 + }, + { + "text": "thought", + "start": 158.2, + "end": 158.38, + "confidence": 0.991 + }, + { + "text": "about", + "start": 158.38, + "end": 158.58, + "confidence": 0.995 + }, + { + "text": "wreaking", + "start": 158.58, + "end": 158.86, + "confidence": 0.996 + }, + { + "text": "havoc", + "start": 158.86, + "end": 159.08, + "confidence": 1.0 + }, + { + "text": "on", + "start": 159.08, + "end": 159.32, + "confidence": 0.862 + }, + { + "text": "an", + "start": 159.32, + "end": 159.46, + "confidence": 0.913 + }, + { + "text": 
"opposition.", + "start": 159.46, + "end": 159.84, + "confidence": 0.991 + } + ] + }, + { + "id": 29, + "seek": 14012, + "start": 159.86, + "end": 161.02, + "text": " Kind of shocking, they want it static.", + "tokens": [ + 51350, + 9242, + 295, + 18776, + 11, + 436, + 528, + 309, + 13437, + 13, + 51410 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.667, + "words": [ + { + "text": "Kind", + "start": 159.86, + "end": 160.06, + "confidence": 0.661 + }, + { + "text": "of", + "start": 160.06, + "end": 160.18, + "confidence": 0.995 + }, + { + "text": "shocking,", + "start": 160.18, + "end": 160.38, + "confidence": 0.656 + }, + { + "text": "they", + "start": 160.52, + "end": 160.6, + "confidence": 0.366 + }, + { + "text": "want", + "start": 160.6, + "end": 160.74, + "confidence": 0.574 + }, + { + "text": "it", + "start": 160.74, + "end": 160.88, + "confidence": 0.651 + }, + { + "text": "static.", + "start": 160.88, + "end": 161.02, + "confidence": 0.993 + } + ] + }, + { + "id": 30, + "seek": 14012, + "start": 161.08, + "end": 162.18, + "text": " With precision, I'm automatic.", + "tokens": [ + 51410, + 2022, + 18356, + 11, + 286, + 478, + 12509, + 13, + 51468 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.874, + "words": [ + { + "text": "With", + "start": 161.08, + "end": 161.28, + "confidence": 0.587 + }, + { + "text": "precision,", + "start": 161.28, + "end": 161.58, + "confidence": 0.904 + }, + { + "text": "I'm", + "start": 161.68, + "end": 161.88, + "confidence": 0.987 + }, + { + "text": "automatic.", + "start": 161.88, + "end": 162.18, + "confidence": 0.987 + } + ] + }, + { + "id": 31, + "seek": 14012, + "start": 162.24, + "end": 163.34, + "text": " Quarterback, I ain't talking second.", + "tokens": [ + 51468, + 43794, + 3207, + 
11, + 286, + 7862, + 380, + 1417, + 1150, + 13, + 51527 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.687, + "words": [ + { + "text": "Quarterback,", + "start": 162.24, + "end": 162.66, + "confidence": 0.511 + }, + { + "text": "I", + "start": 162.66, + "end": 162.78, + "confidence": 0.964 + }, + { + "text": "ain't", + "start": 162.78, + "end": 162.9, + "confidence": 0.99 + }, + { + "text": "talking", + "start": 162.9, + "end": 163.1, + "confidence": 0.891 + }, + { + "text": "second.", + "start": 163.1, + "end": 163.34, + "confidence": 0.327 + } + ] + }, + { + "id": 32, + "seek": 14012, + "start": 163.36, + "end": 164.12, + "text": " Pack it, pack it up.", + "tokens": [ + 51527, + 18466, + 309, + 11, + 2844, + 309, + 493, + 13, + 51562 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.973, + "words": [ + { + "text": "Pack", + "start": 163.36, + "end": 163.62, + "confidence": 0.967 + }, + { + "text": "it,", + "start": 163.62, + "end": 163.68, + "confidence": 0.937 + }, + { + "text": "pack", + "start": 163.68, + "end": 163.88, + "confidence": 0.986 + }, + { + "text": "it", + "start": 163.88, + "end": 164.0, + "confidence": 0.999 + }, + { + "text": "up.", + "start": 164.0, + "end": 164.12, + "confidence": 0.979 + } + ] + }, + { + "id": 33, + "seek": 14012, + "start": 164.12, + "end": 165.04, + "text": " I don't panic, better, better.", + "tokens": [ + 51562, + 286, + 500, + 380, + 14783, + 11, + 1101, + 11, + 1101, + 13, + 51612 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.76, + "words": [ + { + "text": "I", + "start": 164.12, + "end": 164.18, + "confidence": 0.984 + }, + { + "text": "don't", + "start": 164.18, + 
"end": 164.34, + "confidence": 0.912 + }, + { + "text": "panic,", + "start": 164.34, + "end": 164.58, + "confidence": 0.999 + }, + { + "text": "better,", + "start": 164.6, + "end": 164.86, + "confidence": 0.424 + }, + { + "text": "better.", + "start": 164.86, + "end": 165.04, + "confidence": 0.555 + } + ] + }, + { + "id": 34, + "seek": 14012, + "start": 165.14, + "end": 165.74, + "text": " Up who the baddest.", + "tokens": [ + 51612, + 5858, + 567, + 264, + 1578, + 23748, + 13, + 51644 + ], + "temperature": 0.0, + "avg_logprob": -0.36420179578993056, + "compression_ratio": 1.7333333333333334, + "no_speech_prob": 0.7754144668579102, + "confidence": 0.75, + "words": [ + { + "text": "Up", + "start": 165.14, + "end": 165.28, + "confidence": 0.517 + }, + { + "text": "who", + "start": 165.28, + "end": 165.4, + "confidence": 0.747 + }, + { + "text": "the", + "start": 165.4, + "end": 165.54, + "confidence": 0.926 + }, + { + "text": "baddest.", + "start": 165.54, + "end": 165.74, + "confidence": 0.816 + } + ] + }, + { + "id": 35, + "seek": 16572, + "start": 165.74, + "end": 166.84, + "text": " it don't matter cause we is your enemy.", + "tokens": [ + 50364, + 309, + 500, + 380, + 1871, + 3082, + 321, + 307, + 428, + 5945, + 13, + 50414 + ], + "temperature": 0.0, + "avg_logprob": -0.9108315981351413, + "compression_ratio": 0.8297872340425532, + "no_speech_prob": 0.6954025626182556, + "confidence": 0.447, + "words": [ + { + "text": "it", + "start": 165.74, + "end": 165.88, + "confidence": 0.125 + }, + { + "text": "don't", + "start": 165.88, + "end": 166.06, + "confidence": 0.825 + }, + { + "text": "matter", + "start": 166.06, + "end": 166.22, + "confidence": 0.996 + }, + { + "text": "cause", + "start": 166.22, + "end": 166.4, + "confidence": 0.287 + }, + { + "text": "we", + "start": 166.4, + "end": 166.56, + "confidence": 0.889 + }, + { + "text": "is", + "start": 166.56, + "end": 166.66, + "confidence": 0.229 + }, + { + "text": "your", + "start": 166.66, + "end": 166.76, + 
"confidence": 0.561 + }, + { + "text": "enemy.", + "start": 166.76, + "end": 166.84, + "confidence": 0.257 + } + ] + }, + { + "id": 36, + "seek": 19572, + "start": 195.72, + "end": 198.2, + "text": " I swear I'll never be insane", + "tokens": [ + 50364, + 286, + 11902, + 286, + 603, + 1128, + 312, + 10838, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.5534874200820923, + "compression_ratio": 1.0, + "no_speech_prob": 0.6747308969497681, + "confidence": 0.773, + "words": [ + { + "text": "I", + "start": 195.72, + "end": 196.38, + "confidence": 0.745 + }, + { + "text": "swear", + "start": 196.38, + "end": 196.74, + "confidence": 0.963 + }, + { + "text": "I'll", + "start": 196.74, + "end": 197.18, + "confidence": 0.665 + }, + { + "text": "never", + "start": 197.18, + "end": 197.58, + "confidence": 0.997 + }, + { + "text": "be", + "start": 197.58, + "end": 197.92, + "confidence": 0.994 + }, + { + "text": "insane", + "start": 197.92, + "end": 198.2, + "confidence": 0.525 + } + ] + }, + { + "id": 37, + "seek": 19572, + "start": 198.5, + "end": 199.38, + "text": " You gotta be insane", + "tokens": [ + 50464, + 509, + 3428, + 312, + 10838, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.5534874200820923, + "compression_ratio": 1.0, + "no_speech_prob": 0.6747308969497681, + "confidence": 0.492, + "words": [ + { + "text": "You", + "start": 198.5, + "end": 198.7, + "confidence": 0.4 + }, + { + "text": "gotta", + "start": 198.7, + "end": 198.88, + "confidence": 0.268 + }, + { + "text": "be", + "start": 198.88, + "end": 199.12, + "confidence": 0.959 + }, + { + "text": "insane", + "start": 199.12, + "end": 199.38, + "confidence": 0.568 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/random.nocond_apollo11.mp3.words.json b/tests/expected/corner_cases/random.nocond_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0775c1c9b63b2413a5180c6c157f59125fe90b --- 
/dev/null +++ b/tests/expected/corner_cases/random.nocond_apollo11.mp3.words.json @@ -0,0 +1,2003 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA. Alright, okay, we like the... Yeah, I'll put that there, my friend. They make the one that's on the helmet we were going to have in B1. And you can put the other one on the mic helmet with those GVA flipper strings. I got them. I got them. They're the better now. They're the one that got the one right there. They're going to the leak reshaping. We got them in there. I got them in bags. And I just... Yeah. I got them in the album bags. At least it's in the album bags. Right here. Right here. Yeah, we're taking Nick and me out. Yeah, we're thinking next week on a... You know, we were... We were going to hang with the cover, I tried it already. Okay, fine, we weren't sure of that, just a suggestion. We thought we'd... you could check it out. I'm not sure if you've already done that. So, I guess we're going to come up with this, let us know. Okay, no problem. Okay, no problem. We'll let you know when the end of the... ...sun. 
Bye.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.52, + "end": 6.54, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA.", + "tokens": [ + 50364, + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 20914, + 460, + 2634, + 15454, + 460, + 20914, + 13, + 50714 + ], + "temperature": 0.1, + "avg_logprob": -0.7576699998643663, + "compression_ratio": 1.4202898550724639, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.541, + "words": [ + { + "text": "Apollo", + "start": 0.52, + "end": 0.88, + "confidence": 0.155 + }, + { + "text": "11,", + "start": 0.88, + "end": 1.26, + "confidence": 0.977 + }, + { + "text": "Houston", + "start": 1.52, + "end": 1.72, + "confidence": 0.986 + }, + { + "text": "we", + "start": 1.72, + "end": 1.94, + "confidence": 0.518 + }, + { + "text": "got", + "start": 1.94, + "end": 2.1, + "confidence": 0.823 + }, + { + "text": "a", + "start": 2.1, + "end": 2.26, + "confidence": 0.989 + }, + { + "text": "recommendation", + "start": 2.26, + "end": 2.86, + "confidence": 0.968 + }, + { + "text": "for", + "start": 2.86, + "end": 3.44, + "confidence": 0.946 + }, + { + "text": "you", + "start": 3.44, + "end": 3.6, + "confidence": 0.984 + }, + { + "text": "on", + "start": 3.6, + "end": 3.72, + "confidence": 0.909 + }, + { + "text": "your", + "start": 3.72, + "end": 3.92, + "confidence": 0.971 + }, + { + "text": "Soyuz-VA", + "start": 3.92, + "end": 5.16, + "confidence": 0.26 + }, + { + "text": "GLEME", + "start": 5.16, + "end": 5.74, + "confidence": 0.475 + }, + { + "text": "GVA.", + "start": 5.74, + "end": 6.54, + "confidence": 0.435 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.8, + "end": 13.48, + "text": " Alright, okay, we like the...", + "tokens": [ + 50714, + 2798, + 11, + 1392, + 11, + 321, + 411, + 264, + 485, + 51014 + ], + "temperature": 0.1, + "avg_logprob": -0.7576699998643663, + "compression_ratio": 
1.4202898550724639, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.412, + "words": [ + { + "text": "Alright,", + "start": 10.8, + "end": 11.04, + "confidence": 0.31 + }, + { + "text": "okay,", + "start": 11.68, + "end": 12.22, + "confidence": 0.504 + }, + { + "text": "we", + "start": 12.5, + "end": 12.98, + "confidence": 0.609 + }, + { + "text": "like", + "start": 12.98, + "end": 13.26, + "confidence": 0.505 + }, + { + "text": "the...", + "start": 13.26, + "end": 13.48, + "confidence": 0.247 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 13.48, + "end": 14.6, + "text": " Yeah, I'll put that there, my friend.", + "tokens": [ + 51014, + 865, + 11, + 286, + 603, + 829, + 300, + 456, + 11, + 452, + 1277, + 13, + 51114 + ], + "temperature": 0.1, + "avg_logprob": -0.7576699998643663, + "compression_ratio": 1.4202898550724639, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.218, + "words": [ + { + "text": "Yeah,", + "start": 13.48, + "end": 13.5, + "confidence": 0.281 + }, + { + "text": "I'll", + "start": 13.5, + "end": 13.78, + "confidence": 0.195 + }, + { + "text": "put", + "start": 13.78, + "end": 13.96, + "confidence": 0.206 + }, + { + "text": "that", + "start": 13.96, + "end": 14.12, + "confidence": 0.86 + }, + { + "text": "there,", + "start": 14.12, + "end": 14.38, + "confidence": 0.325 + }, + { + "text": "my", + "start": 14.4, + "end": 14.54, + "confidence": 0.095 + }, + { + "text": "friend.", + "start": 14.54, + "end": 14.6, + "confidence": 0.088 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 14.6, + "end": 19.08, + "text": " They make the one that's on the helmet we were going to have in B1.", + "tokens": [ + 51114, + 814, + 652, + 264, + 472, + 300, + 311, + 322, + 264, + 15922, + 321, + 645, + 516, + 281, + 362, + 294, + 363, + 16, + 13, + 51314 + ], + "temperature": 0.1, + "avg_logprob": -0.7576699998643663, + "compression_ratio": 1.4202898550724639, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.6, + "words": [ + { 
+ "text": "They", + "start": 14.6, + "end": 15.46, + "confidence": 0.366 + }, + { + "text": "make", + "start": 15.46, + "end": 15.68, + "confidence": 0.458 + }, + { + "text": "the", + "start": 15.68, + "end": 15.84, + "confidence": 0.354 + }, + { + "text": "one", + "start": 15.84, + "end": 16.06, + "confidence": 0.71 + }, + { + "text": "that's", + "start": 16.06, + "end": 16.28, + "confidence": 0.572 + }, + { + "text": "on", + "start": 16.28, + "end": 16.48, + "confidence": 0.636 + }, + { + "text": "the", + "start": 16.48, + "end": 16.78, + "confidence": 0.858 + }, + { + "text": "helmet", + "start": 16.78, + "end": 17.26, + "confidence": 0.892 + }, + { + "text": "we", + "start": 17.26, + "end": 17.52, + "confidence": 0.185 + }, + { + "text": "were", + "start": 17.52, + "end": 17.78, + "confidence": 0.529 + }, + { + "text": "going", + "start": 17.78, + "end": 17.92, + "confidence": 0.55 + }, + { + "text": "to", + "start": 17.92, + "end": 17.98, + "confidence": 0.984 + }, + { + "text": "have", + "start": 17.98, + "end": 18.2, + "confidence": 0.958 + }, + { + "text": "in", + "start": 18.2, + "end": 18.38, + "confidence": 0.844 + }, + { + "text": "B1.", + "start": 18.38, + "end": 19.08, + "confidence": 0.765 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 20.12, + "end": 24.52, + "text": " And you can put the other one on the mic helmet with those GVA flipper strings.", + "tokens": [ + 51314, + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 932, + 15124, + 13985, + 13, + 51614 + ], + "temperature": 0.1, + "avg_logprob": -0.7576699998643663, + "compression_ratio": 1.4202898550724639, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.468, + "words": [ + { + "text": "And", + "start": 20.12, + "end": 20.16, + "confidence": 0.534 + }, + { + "text": "you", + "start": 20.16, + "end": 20.32, + "confidence": 0.942 + }, + { + "text": "can", + "start": 20.32, + "end": 20.48, + "confidence": 0.74 + }, + { 
+ "text": "put", + "start": 20.48, + "end": 20.64, + "confidence": 0.992 + }, + { + "text": "the", + "start": 20.64, + "end": 20.84, + "confidence": 0.99 + }, + { + "text": "other", + "start": 20.84, + "end": 21.0, + "confidence": 0.993 + }, + { + "text": "one", + "start": 21.0, + "end": 21.18, + "confidence": 0.982 + }, + { + "text": "on", + "start": 21.18, + "end": 21.42, + "confidence": 0.989 + }, + { + "text": "the", + "start": 21.42, + "end": 21.94, + "confidence": 0.462 + }, + { + "text": "mic", + "start": 21.94, + "end": 22.48, + "confidence": 0.384 + }, + { + "text": "helmet", + "start": 22.48, + "end": 22.8, + "confidence": 0.89 + }, + { + "text": "with", + "start": 22.8, + "end": 23.06, + "confidence": 0.436 + }, + { + "text": "those", + "start": 23.06, + "end": 23.3, + "confidence": 0.45 + }, + { + "text": "GVA", + "start": 23.3, + "end": 23.74, + "confidence": 0.222 + }, + { + "text": "flipper", + "start": 23.74, + "end": 24.18, + "confidence": 0.103 + }, + { + "text": "strings.", + "start": 24.18, + "end": 24.52, + "confidence": 0.207 + } + ] + }, + { + "id": 5, + "seek": 2500, + "start": 31.32, + "end": 34.03, + "text": " I got them. I got them. 
They're the better now.", + "tokens": [ + 50364, + 286, + 658, + 552, + 13, + 286, + 658, + 552, + 13, + 814, + 434, + 264, + 1101, + 586, + 13, + 50814 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.45, + "words": [ + { + "text": "I", + "start": 31.32, + "end": 31.52, + "confidence": 0.121 + }, + { + "text": "got", + "start": 31.52, + "end": 31.82, + "confidence": 0.464 + }, + { + "text": "them.", + "start": 31.82, + "end": 32.12, + "confidence": 0.264 + }, + { + "text": "I", + "start": 32.44, + "end": 32.84, + "confidence": 0.385 + }, + { + "text": "got", + "start": 32.84, + "end": 33.16, + "confidence": 0.967 + }, + { + "text": "them.", + "start": 33.16, + "end": 33.44, + "confidence": 0.958 + }, + { + "text": "They're", + "start": 33.44, + "end": 33.5, + "confidence": 0.389 + }, + { + "text": "the", + "start": 33.5, + "end": 33.56, + "confidence": 0.312 + }, + { + "text": "better", + "start": 33.56, + "end": 33.76, + "confidence": 0.763 + }, + { + "text": "now.", + "start": 33.76, + "end": 34.03, + "confidence": 0.795 + } + ] + }, + { + "id": 6, + "seek": 2500, + "start": 34.03, + "end": 36.36, + "text": " They're the one that got the one right there.", + "tokens": [ + 50814, + 814, + 434, + 264, + 472, + 300, + 658, + 264, + 472, + 558, + 456, + 13, + 50964 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.275, + "words": [ + { + "text": "They're", + "start": 34.03, + "end": 34.38, + "confidence": 0.243 + }, + { + "text": "the", + "start": 34.38, + "end": 34.58, + "confidence": 0.738 + }, + { + "text": "one", + "start": 34.58, + "end": 34.94, + "confidence": 0.279 + }, + { + "text": "that", + "start": 34.94, + "end": 35.28, + "confidence": 0.456 + }, + { + "text": "got", + "start": 35.28, + "end": 35.48, + "confidence": 0.186 + }, 
+ { + "text": "the", + "start": 35.48, + "end": 35.68, + "confidence": 0.439 + }, + { + "text": "one", + "start": 35.68, + "end": 35.76, + "confidence": 0.154 + }, + { + "text": "right", + "start": 35.76, + "end": 36.04, + "confidence": 0.08 + }, + { + "text": "there.", + "start": 36.04, + "end": 36.36, + "confidence": 0.454 + } + ] + }, + { + "id": 7, + "seek": 2500, + "start": 37.62, + "end": 39.38, + "text": " They're going to the leak reshaping.", + "tokens": [ + 50964, + 814, + 434, + 516, + 281, + 264, + 17143, + 725, + 71, + 569, + 278, + 13, + 51114 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.287, + "words": [ + { + "text": "They're", + "start": 37.62, + "end": 37.96, + "confidence": 0.506 + }, + { + "text": "going", + "start": 37.96, + "end": 38.12, + "confidence": 0.907 + }, + { + "text": "to", + "start": 38.12, + "end": 38.36, + "confidence": 0.282 + }, + { + "text": "the", + "start": 38.36, + "end": 38.48, + "confidence": 0.145 + }, + { + "text": "leak", + "start": 38.48, + "end": 38.76, + "confidence": 0.068 + }, + { + "text": "reshaping.", + "start": 38.76, + "end": 39.38, + "confidence": 0.275 + } + ] + }, + { + "id": 8, + "seek": 2500, + "start": 39.88, + "end": 40.98, + "text": " We got them in there.", + "tokens": [ + 51114, + 492, + 658, + 552, + 294, + 456, + 13, + 51164 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.722, + "words": [ + { + "text": "We", + "start": 39.88, + "end": 40.22, + "confidence": 0.62 + }, + { + "text": "got", + "start": 40.22, + "end": 40.48, + "confidence": 0.571 + }, + { + "text": "them", + "start": 40.48, + "end": 40.64, + "confidence": 0.956 + }, + { + "text": "in", + "start": 40.64, + "end": 40.74, + "confidence": 0.946 + }, + { + "text": "there.", + "start": 40.74, + "end": 40.98, 
+ "confidence": 0.612 + } + ] + }, + { + "id": 9, + "seek": 2500, + "start": 41.22, + "end": 41.98, + "text": " I got them in bags.", + "tokens": [ + 51164, + 286, + 658, + 552, + 294, + 10405, + 13, + 51264 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.397, + "words": [ + { + "text": "I", + "start": 41.22, + "end": 41.32, + "confidence": 0.236 + }, + { + "text": "got", + "start": 41.32, + "end": 41.5, + "confidence": 0.153 + }, + { + "text": "them", + "start": 41.5, + "end": 41.56, + "confidence": 0.852 + }, + { + "text": "in", + "start": 41.56, + "end": 41.72, + "confidence": 0.861 + }, + { + "text": "bags.", + "start": 41.72, + "end": 41.98, + "confidence": 0.374 + } + ] + }, + { + "id": 10, + "seek": 2500, + "start": 43.1, + "end": 44.48, + "text": " And I just...", + "tokens": [ + 51264, + 400, + 286, + 445, + 485, + 51364 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.367, + "words": [ + { + "text": "And", + "start": 43.1, + "end": 43.36, + "confidence": 0.573 + }, + { + "text": "I", + "start": 43.36, + "end": 44.0, + "confidence": 0.332 + }, + { + "text": "just...", + "start": 44.0, + "end": 44.48, + "confidence": 0.26 + } + ] + }, + { + "id": 11, + "seek": 2500, + "start": 45.22, + "end": 45.4, + "text": " Yeah.", + "tokens": [ + 51364, + 865, + 13, + 51414 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.283, + "words": [ + { + "text": "Yeah.", + "start": 45.22, + "end": 45.4, + "confidence": 0.283 + } + ] + }, + { + "id": 12, + "seek": 2500, + "start": 46.2, + "end": 47.4, + "text": " I got them in the album bags.", + "tokens": [ + 51414, + 286, + 658, + 552, + 294, + 264, + 6030, + 10405, + 13, + 51514 + ], 
+ "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.445, + "words": [ + { + "text": "I", + "start": 46.2, + "end": 46.38, + "confidence": 0.297 + }, + { + "text": "got", + "start": 46.38, + "end": 46.46, + "confidence": 0.548 + }, + { + "text": "them", + "start": 46.46, + "end": 46.5, + "confidence": 0.959 + }, + { + "text": "in", + "start": 46.5, + "end": 46.74, + "confidence": 0.906 + }, + { + "text": "the", + "start": 46.74, + "end": 46.92, + "confidence": 0.453 + }, + { + "text": "album", + "start": 46.92, + "end": 47.06, + "confidence": 0.22 + }, + { + "text": "bags.", + "start": 47.06, + "end": 47.4, + "confidence": 0.246 + } + ] + }, + { + "id": 13, + "seek": 2500, + "start": 48.22, + "end": 49.58, + "text": " At least it's in the album bags.", + "tokens": [ + 51514, + 1711, + 1935, + 309, + 311, + 294, + 264, + 6030, + 10405, + 13, + 51614 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.606, + "words": [ + { + "text": "At", + "start": 48.22, + "end": 48.34, + "confidence": 0.184 + }, + { + "text": "least", + "start": 48.34, + "end": 48.6, + "confidence": 0.907 + }, + { + "text": "it's", + "start": 48.6, + "end": 48.86, + "confidence": 0.567 + }, + { + "text": "in", + "start": 48.86, + "end": 48.96, + "confidence": 0.802 + }, + { + "text": "the", + "start": 48.96, + "end": 49.1, + "confidence": 0.586 + }, + { + "text": "album", + "start": 49.1, + "end": 49.22, + "confidence": 0.862 + }, + { + "text": "bags.", + "start": 49.22, + "end": 49.58, + "confidence": 0.837 + } + ] + }, + { + "id": 14, + "seek": 2500, + "start": 50.1, + "end": 50.6, + "text": " Right here.", + "tokens": [ + 51614, + 1779, + 510, + 13, + 51664 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + 
"no_speech_prob": 0.8235840797424316, + "confidence": 0.308, + "words": [ + { + "text": "Right", + "start": 50.1, + "end": 50.4, + "confidence": 0.29 + }, + { + "text": "here.", + "start": 50.4, + "end": 50.6, + "confidence": 0.327 + } + ] + }, + { + "id": 15, + "seek": 2500, + "start": 51.46, + "end": 51.83, + "text": " Right here.", + "tokens": [ + 51664, + 1779, + 510, + 13, + 51714 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.82, + "words": [ + { + "text": "Right", + "start": 51.46, + "end": 51.74, + "confidence": 0.73 + }, + { + "text": "here.", + "start": 51.74, + "end": 51.83, + "confidence": 0.921 + } + ] + }, + { + "id": 16, + "seek": 2500, + "start": 51.83, + "end": 52.88, + "text": " Yeah, we're taking Nick and me out.", + "tokens": [ + 51714, + 865, + 11, + 321, + 434, + 1940, + 9449, + 293, + 385, + 484, + 13, + 51764 + ], + "temperature": 0.1, + "avg_logprob": -0.7381767340465984, + "compression_ratio": 1.920731707317073, + "no_speech_prob": 0.8235840797424316, + "confidence": 0.395, + "words": [ + { + "text": "Yeah,", + "start": 51.83, + "end": 52.16, + "confidence": 0.158 + }, + { + "text": "we're", + "start": 52.16, + "end": 52.26, + "confidence": 0.635 + }, + { + "text": "taking", + "start": 52.26, + "end": 52.28, + "confidence": 0.611 + }, + { + "text": "Nick", + "start": 52.28, + "end": 52.52, + "confidence": 0.185 + }, + { + "text": "and", + "start": 52.52, + "end": 52.64, + "confidence": 0.143 + }, + { + "text": "me", + "start": 52.64, + "end": 52.74, + "confidence": 0.683 + }, + { + "text": "out.", + "start": 52.74, + "end": 52.88, + "confidence": 0.837 + } + ] + }, + { + "id": 17, + "seek": 5300, + "start": 53.1, + "end": 54.57, + "text": " Yeah, we're thinking next week on a...", + "tokens": [ + 50364, + 865, + 11, + 321, + 434, + 1953, + 958, + 1243, + 322, + 257, + 485, + 50464 + ], + "temperature": 0.1, + "avg_logprob": 
-0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.419, + "words": [ + { + "text": "Yeah,", + "start": 53.1, + "end": 53.26, + "confidence": 0.657 + }, + { + "text": "we're", + "start": 53.34, + "end": 53.44, + "confidence": 0.583 + }, + { + "text": "thinking", + "start": 53.44, + "end": 53.62, + "confidence": 0.593 + }, + { + "text": "next", + "start": 53.62, + "end": 53.86, + "confidence": 0.343 + }, + { + "text": "week", + "start": 53.86, + "end": 54.06, + "confidence": 0.383 + }, + { + "text": "on", + "start": 54.06, + "end": 54.22, + "confidence": 0.251 + }, + { + "text": "a...", + "start": 54.22, + "end": 54.57, + "confidence": 0.216 + } + ] + }, + { + "id": 18, + "seek": 5300, + "start": 54.57, + "end": 57.34, + "text": " You know, we were...", + "tokens": [ + 50464, + 509, + 458, + 11, + 321, + 645, + 485, + 50564 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.463, + "words": [ + { + "text": "You", + "start": 54.57, + "end": 55.08, + "confidence": 0.18 + }, + { + "text": "know,", + "start": 55.08, + "end": 55.2, + "confidence": 0.915 + }, + { + "text": "we", + "start": 56.36, + "end": 56.62, + "confidence": 0.392 + }, + { + "text": "were...", + "start": 56.62, + "end": 57.34, + "confidence": 0.71 + } + ] + }, + { + "id": 19, + "seek": 5300, + "start": 57.86, + "end": 61.8, + "text": " We were going to hang with the cover, I tried it already.", + "tokens": [ + 50564, + 492, + 645, + 516, + 281, + 3967, + 365, + 264, + 2060, + 11, + 286, + 3031, + 309, + 1217, + 13, + 50814 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.421, + "words": [ + { + "text": "We", + "start": 57.86, + "end": 58.0, + "confidence": 0.388 + }, + { + "text": "were", + "start": 58.0, + 
"end": 58.4, + "confidence": 0.245 + }, + { + "text": "going", + "start": 58.4, + "end": 58.54, + "confidence": 0.258 + }, + { + "text": "to", + "start": 58.54, + "end": 58.7, + "confidence": 0.935 + }, + { + "text": "hang", + "start": 58.7, + "end": 58.72, + "confidence": 0.406 + }, + { + "text": "with", + "start": 58.72, + "end": 59.22, + "confidence": 0.25 + }, + { + "text": "the", + "start": 59.22, + "end": 59.5, + "confidence": 0.191 + }, + { + "text": "cover,", + "start": 59.5, + "end": 61.02, + "confidence": 0.352 + }, + { + "text": "I", + "start": 61.18, + "end": 61.24, + "confidence": 0.573 + }, + { + "text": "tried", + "start": 61.24, + "end": 61.44, + "confidence": 0.644 + }, + { + "text": "it", + "start": 61.44, + "end": 61.62, + "confidence": 0.602 + }, + { + "text": "already.", + "start": 61.62, + "end": 61.8, + "confidence": 0.896 + } + ] + }, + { + "id": 20, + "seek": 5300, + "start": 62.52, + "end": 65.12, + "text": " Okay, fine, we weren't sure of that, just a suggestion.", + "tokens": [ + 50814, + 1033, + 11, + 2489, + 11, + 321, + 4999, + 380, + 988, + 295, + 300, + 11, + 445, + 257, + 16541, + 13, + 50964 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.86, + "words": [ + { + "text": "Okay,", + "start": 62.52, + "end": 62.78, + "confidence": 0.731 + }, + { + "text": "fine,", + "start": 62.9, + "end": 63.06, + "confidence": 0.955 + }, + { + "text": "we", + "start": 63.16, + "end": 63.3, + "confidence": 0.968 + }, + { + "text": "weren't", + "start": 63.3, + "end": 63.56, + "confidence": 0.993 + }, + { + "text": "sure", + "start": 63.56, + "end": 63.72, + "confidence": 0.974 + }, + { + "text": "of", + "start": 63.72, + "end": 63.86, + "confidence": 0.598 + }, + { + "text": "that,", + "start": 63.86, + "end": 63.98, + "confidence": 0.993 + }, + { + "text": "just", + "start": 64.1, + "end": 64.56, + "confidence": 0.637 + }, + { + 
"text": "a", + "start": 64.56, + "end": 64.74, + "confidence": 0.779 + }, + { + "text": "suggestion.", + "start": 64.74, + "end": 65.12, + "confidence": 0.998 + } + ] + }, + { + "id": 21, + "seek": 5300, + "start": 65.22, + "end": 67.7, + "text": " We thought we'd... you could check it out.", + "tokens": [ + 50964, + 492, + 1194, + 321, + 1116, + 485, + 291, + 727, + 1520, + 309, + 484, + 13, + 51114 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.794, + "words": [ + { + "text": "We", + "start": 65.22, + "end": 65.42, + "confidence": 0.896 + }, + { + "text": "thought", + "start": 65.42, + "end": 65.54, + "confidence": 0.983 + }, + { + "text": "we'd...", + "start": 65.54, + "end": 66.06, + "confidence": 0.818 + }, + { + "text": "you", + "start": 66.06, + "end": 67.04, + "confidence": 0.308 + }, + { + "text": "could", + "start": 67.04, + "end": 67.2, + "confidence": 0.777 + }, + { + "text": "check", + "start": 67.2, + "end": 67.38, + "confidence": 0.888 + }, + { + "text": "it", + "start": 67.38, + "end": 67.54, + "confidence": 0.996 + }, + { + "text": "out.", + "start": 67.54, + "end": 67.7, + "confidence": 0.998 + } + ] + }, + { + "id": 22, + "seek": 5300, + "start": 68.2, + "end": 69.26, + "text": " I'm not sure if you've already done that.", + "tokens": [ + 51114, + 286, + 478, + 406, + 988, + 498, + 291, + 600, + 1217, + 1096, + 300, + 13, + 51214 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.465, + "words": [ + { + "text": "I'm", + "start": 68.2, + "end": 68.44, + "confidence": 0.341 + }, + { + "text": "not", + "start": 68.44, + "end": 68.5, + "confidence": 0.399 + }, + { + "text": "sure", + "start": 68.5, + "end": 68.64, + "confidence": 0.854 + }, + { + "text": "if", + "start": 68.64, + "end": 68.66, + "confidence": 0.463 + }, + 
{ + "text": "you've", + "start": 68.66, + "end": 68.72, + "confidence": 0.384 + }, + { + "text": "already", + "start": 68.72, + "end": 68.86, + "confidence": 0.427 + }, + { + "text": "done", + "start": 68.86, + "end": 69.06, + "confidence": 0.408 + }, + { + "text": "that.", + "start": 69.06, + "end": 69.26, + "confidence": 0.993 + } + ] + }, + { + "id": 23, + "seek": 5300, + "start": 69.5, + "end": 72.44, + "text": " So, I guess we're going to come up with this, let us know.", + "tokens": [ + 51214, + 407, + 11, + 286, + 2041, + 321, + 434, + 516, + 281, + 808, + 493, + 365, + 341, + 11, + 718, + 505, + 458, + 13, + 51364 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.746, + "words": [ + { + "text": "So,", + "start": 69.5, + "end": 69.6, + "confidence": 0.664 + }, + { + "text": "I", + "start": 69.7, + "end": 69.88, + "confidence": 0.812 + }, + { + "text": "guess", + "start": 69.88, + "end": 70.62, + "confidence": 0.99 + }, + { + "text": "we're", + "start": 70.62, + "end": 71.08, + "confidence": 0.743 + }, + { + "text": "going", + "start": 71.08, + "end": 71.22, + "confidence": 0.542 + }, + { + "text": "to", + "start": 71.22, + "end": 71.28, + "confidence": 0.989 + }, + { + "text": "come", + "start": 71.28, + "end": 71.42, + "confidence": 0.936 + }, + { + "text": "up", + "start": 71.42, + "end": 71.6, + "confidence": 0.676 + }, + { + "text": "with", + "start": 71.6, + "end": 71.76, + "confidence": 0.966 + }, + { + "text": "this,", + "start": 71.76, + "end": 71.9, + "confidence": 0.239 + }, + { + "text": "let", + "start": 72.1, + "end": 72.12, + "confidence": 0.718 + }, + { + "text": "us", + "start": 72.12, + "end": 72.24, + "confidence": 0.997 + }, + { + "text": "know.", + "start": 72.24, + "end": 72.44, + "confidence": 0.998 + } + ] + }, + { + "id": 24, + "seek": 5300, + "start": 74.22, + "end": 75.16, + "text": " Okay, no problem.", + "tokens": [ + 
51414, + 1033, + 11, + 572, + 1154, + 13, + 51464 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.903, + "words": [ + { + "text": "Okay,", + "start": 74.22, + "end": 74.48, + "confidence": 0.835 + }, + { + "text": "no", + "start": 74.58, + "end": 74.82, + "confidence": 0.913 + }, + { + "text": "problem.", + "start": 74.82, + "end": 75.16, + "confidence": 0.968 + } + ] + }, + { + "id": 25, + "seek": 5300, + "start": 75.2, + "end": 76.48, + "text": " Okay, no problem.", + "tokens": [ + 51464, + 1033, + 11, + 572, + 1154, + 13, + 51514 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.819, + "words": [ + { + "text": "Okay,", + "start": 75.2, + "end": 75.8, + "confidence": 0.607 + }, + { + "text": "no", + "start": 75.92, + "end": 76.14, + "confidence": 0.908 + }, + { + "text": "problem.", + "start": 76.14, + "end": 76.48, + "confidence": 0.995 + } + ] + }, + { + "id": 26, + "seek": 5300, + "start": 76.54, + "end": 77.86, + "text": " We'll let you know when the end of the...", + "tokens": [ + 51514, + 492, + 603, + 718, + 291, + 458, + 562, + 264, + 917, + 295, + 264, + 485, + 51614 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.739, + "words": [ + { + "text": "We'll", + "start": 76.54, + "end": 76.8, + "confidence": 0.755 + }, + { + "text": "let", + "start": 76.8, + "end": 76.92, + "confidence": 0.955 + }, + { + "text": "you", + "start": 76.92, + "end": 77.0, + "confidence": 0.628 + }, + { + "text": "know", + "start": 77.0, + "end": 77.16, + "confidence": 0.997 + }, + { + "text": "when", + "start": 77.16, + "end": 77.32, + "confidence": 0.421 + }, + { + "text": "the", + "start": 77.32, + "end": 77.4, + "confidence": 0.856 + 
}, + { + "text": "end", + "start": 77.4, + "end": 77.52, + "confidence": 0.978 + }, + { + "text": "of", + "start": 77.52, + "end": 77.64, + "confidence": 0.98 + }, + { + "text": "the...", + "start": 77.64, + "end": 77.86, + "confidence": 0.413 + } + ] + }, + { + "id": 27, + "seek": 5300, + "start": 78.02, + "end": 78.24, + "text": " ...sun.", + "tokens": [ + 51614, + 1097, + 11314, + 13, + 51664 + ], + "temperature": 0.1, + "avg_logprob": -0.519427408698861, + "compression_ratio": 1.7004219409282701, + "no_speech_prob": 0.4345245361328125, + "confidence": 0.158, + "words": [ + { + "text": "...sun.", + "start": 78.02, + "end": 78.24, + "confidence": 0.158 + } + ] + }, + { + "id": 28, + "seek": 8300, + "start": 88.8, + "end": 88.82, + "text": " Bye.", + "tokens": [ + 50364, + 4621, + 13, + 50664 + ], + "temperature": 0.1, + "avg_logprob": -1.232518768310547, + "compression_ratio": 0.3333333333333333, + "no_speech_prob": 0.592905580997467, + "confidence": 0.069, + "words": [ + { + "text": "Bye.", + "start": 88.8, + "end": 88.82, + "confidence": 0.069 + } + ] + } + ], + "language": "English" +} \ No newline at end of file diff --git a/tests/expected/corner_cases/random_apollo11.mp3.words.json b/tests/expected/corner_cases/random_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..b4390210f6149284e2dcb88c6a807e9f9cdd3769 --- /dev/null +++ b/tests/expected/corner_cases/random_apollo11.mp3.words.json @@ -0,0 +1,1812 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-EA GLEME GVA. Alright, okay. Yeah, let's take that camera. They make it want to go on the helmet. We're going to have a B1 and you can put the other one on the mic helmet with those GVA. Over. Alright, got them. Alright, got them. They're the better helmet that C1 has. They got the one mic that makes going through the leak reshapes. We got them in there helmet bags. And uh, we got the helmet in there helmet bags. 
The leak system, the leak of the bag. Right, yeah. Yeah, we're taking the leak to the auto, see you later. Hey, we were going to hang with the cover on the right side already. Okay, fine. We weren't sure of that, just a suggestion. We thought we'd, uh, you could check it out. It's not much of a hard to turn on, so uh, I guess we're going to come up with just let us know. Okay, no problem. Okay, no problem. We'll let you know when the end of the sun. Hello.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.52, + "end": 6.54, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-EA GLEME GVA.", + "tokens": [ + 50364, + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 36, + 32, + 460, + 2634, + 15454, + 460, + 20914, + 13, + 50714 + ], + "temperature": 0.2, + "avg_logprob": -0.6685471307663691, + "compression_ratio": 1.3597883597883598, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.548, + "words": [ + { + "text": "Apollo", + "start": 0.52, + "end": 0.88, + "confidence": 0.155 + }, + { + "text": "11,", + "start": 0.88, + "end": 1.26, + "confidence": 0.977 + }, + { + "text": "Houston", + "start": 1.52, + "end": 1.72, + "confidence": 0.986 + }, + { + "text": "we", + "start": 1.72, + "end": 1.94, + "confidence": 0.518 + }, + { + "text": "got", + "start": 1.94, + "end": 2.1, + "confidence": 0.823 + }, + { + "text": "a", + "start": 2.1, + "end": 2.26, + "confidence": 0.989 + }, + { + "text": "recommendation", + "start": 2.26, + "end": 2.86, + "confidence": 0.968 + }, + { + "text": "for", + "start": 2.86, + "end": 3.44, + "confidence": 0.946 + }, + { + "text": "you", + "start": 3.44, + "end": 3.6, + "confidence": 0.984 + }, + { + "text": "on", + "start": 3.6, + "end": 3.72, + "confidence": 0.909 + }, + { + "text": "your", + "start": 3.72, + "end": 3.92, + "confidence": 0.971 + }, + { + "text": "Soyuz-EA", + "start": 3.92, + "end": 5.26, + "confidence": 0.321 + }, + { 
+ "text": "GLEME", + "start": 5.26, + "end": 5.74, + "confidence": 0.558 + }, + { + "text": "GVA.", + "start": 5.74, + "end": 6.54, + "confidence": 0.336 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.8, + "end": 12.2, + "text": " Alright, okay.", + "tokens": [ + 50914, + 2798, + 11, + 1392, + 13, + 50964 + ], + "temperature": 0.2, + "avg_logprob": -0.6685471307663691, + "compression_ratio": 1.3597883597883598, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.366, + "words": [ + { + "text": "Alright,", + "start": 10.8, + "end": 11.08, + "confidence": 0.282 + }, + { + "text": "okay.", + "start": 11.68, + "end": 12.2, + "confidence": 0.476 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 12.82, + "end": 14.4, + "text": " Yeah, let's take that camera.", + "tokens": [ + 51014, + 865, + 11, + 718, + 311, + 747, + 300, + 2799, + 13, + 51064 + ], + "temperature": 0.2, + "avg_logprob": -0.6685471307663691, + "compression_ratio": 1.3597883597883598, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.357, + "words": [ + { + "text": "Yeah,", + "start": 12.82, + "end": 13.0, + "confidence": 0.167 + }, + { + "text": "let's", + "start": 13.04, + "end": 13.38, + "confidence": 0.277 + }, + { + "text": "take", + "start": 13.38, + "end": 14.02, + "confidence": 0.398 + }, + { + "text": "that", + "start": 14.02, + "end": 14.26, + "confidence": 0.478 + }, + { + "text": "camera.", + "start": 14.26, + "end": 14.4, + "confidence": 0.849 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 14.84, + "end": 17.26, + "text": " They make it want to go on the helmet.", + "tokens": [ + 51114, + 814, + 652, + 309, + 528, + 281, + 352, + 322, + 264, + 15922, + 13, + 51214 + ], + "temperature": 0.2, + "avg_logprob": -0.6685471307663691, + "compression_ratio": 1.3597883597883598, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.551, + "words": [ + { + "text": "They", + "start": 14.84, + "end": 15.48, + "confidence": 0.397 + }, + { + "text": "make", + "start": 
15.48, + "end": 15.68, + "confidence": 0.428 + }, + { + "text": "it", + "start": 15.68, + "end": 15.86, + "confidence": 0.21 + }, + { + "text": "want", + "start": 15.86, + "end": 16.06, + "confidence": 0.24 + }, + { + "text": "to", + "start": 16.06, + "end": 16.2, + "confidence": 0.965 + }, + { + "text": "go", + "start": 16.2, + "end": 16.38, + "confidence": 0.904 + }, + { + "text": "on", + "start": 16.38, + "end": 16.6, + "confidence": 0.952 + }, + { + "text": "the", + "start": 16.6, + "end": 16.8, + "confidence": 0.889 + }, + { + "text": "helmet.", + "start": 16.8, + "end": 17.26, + "confidence": 0.745 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 17.62, + "end": 23.74, + "text": " We're going to have a B1 and you can put the other one on the mic helmet with those GVA.", + "tokens": [ + 51264, + 492, + 434, + 516, + 281, + 362, + 257, + 363, + 16, + 293, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 13, + 51564 + ], + "temperature": 0.2, + "avg_logprob": -0.6685471307663691, + "compression_ratio": 1.3597883597883598, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.672, + "words": [ + { + "text": "We're", + "start": 17.62, + "end": 17.8, + "confidence": 0.779 + }, + { + "text": "going", + "start": 17.8, + "end": 17.92, + "confidence": 0.633 + }, + { + "text": "to", + "start": 17.92, + "end": 17.98, + "confidence": 0.992 + }, + { + "text": "have", + "start": 17.98, + "end": 18.2, + "confidence": 0.953 + }, + { + "text": "a", + "start": 18.2, + "end": 18.38, + "confidence": 0.36 + }, + { + "text": "B1", + "start": 18.38, + "end": 19.08, + "confidence": 0.836 + }, + { + "text": "and", + "start": 19.08, + "end": 20.16, + "confidence": 0.42 + }, + { + "text": "you", + "start": 20.16, + "end": 20.32, + "confidence": 0.865 + }, + { + "text": "can", + "start": 20.32, + "end": 20.48, + "confidence": 0.699 + }, + { + "text": "put", + "start": 20.48, + "end": 20.64, + "confidence": 0.971 + }, + { + 
"text": "the", + "start": 20.64, + "end": 20.84, + "confidence": 0.976 + }, + { + "text": "other", + "start": 20.84, + "end": 21.0, + "confidence": 0.995 + }, + { + "text": "one", + "start": 21.0, + "end": 21.18, + "confidence": 0.97 + }, + { + "text": "on", + "start": 21.18, + "end": 21.42, + "confidence": 0.988 + }, + { + "text": "the", + "start": 21.42, + "end": 21.94, + "confidence": 0.627 + }, + { + "text": "mic", + "start": 21.94, + "end": 22.48, + "confidence": 0.391 + }, + { + "text": "helmet", + "start": 22.48, + "end": 22.8, + "confidence": 0.935 + }, + { + "text": "with", + "start": 22.8, + "end": 23.06, + "confidence": 0.466 + }, + { + "text": "those", + "start": 23.06, + "end": 23.3, + "confidence": 0.358 + }, + { + "text": "GVA.", + "start": 23.3, + "end": 23.74, + "confidence": 0.363 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 24.88, + "end": 25.12, + "text": " Over.", + "tokens": [ + 51614, + 4886, + 13, + 51664 + ], + "temperature": 0.2, + "avg_logprob": -0.6685471307663691, + "compression_ratio": 1.3597883597883598, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.29, + "words": [ + { + "text": "Over.", + "start": 24.88, + "end": 25.12, + "confidence": 0.29 + } + ] + }, + { + "id": 6, + "seek": 3000, + "start": 31.28, + "end": 32.12, + "text": " Alright, got them.", + "tokens": [ + 50414, + 2798, + 11, + 658, + 552, + 13, + 50464 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.531, + "words": [ + { + "text": "Alright,", + "start": 31.28, + "end": 31.56, + "confidence": 0.866 + }, + { + "text": "got", + "start": 31.82, + "end": 31.86, + "confidence": 0.43 + }, + { + "text": "them.", + "start": 31.86, + "end": 32.12, + "confidence": 0.402 + } + ] + }, + { + "id": 7, + "seek": 3000, + "start": 32.74, + "end": 33.44, + "text": " Alright, got them.", + "tokens": [ + 50514, + 2798, + 11, + 658, + 552, + 13, + 50564 + 
], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.879, + "words": [ + { + "text": "Alright,", + "start": 32.74, + "end": 32.92, + "confidence": 0.74 + }, + { + "text": "got", + "start": 33.12, + "end": 33.18, + "confidence": 0.939 + }, + { + "text": "them.", + "start": 33.18, + "end": 33.44, + "confidence": 0.976 + } + ] + }, + { + "id": 8, + "seek": 3000, + "start": 34.5, + "end": 35.3, + "text": " They're the better helmet that C1 has.", + "tokens": [ + 50614, + 814, + 434, + 264, + 1101, + 15922, + 300, + 383, + 16, + 575, + 13, + 50664 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.373, + "words": [ + { + "text": "They're", + "start": 34.5, + "end": 34.52, + "confidence": 0.222 + }, + { + "text": "the", + "start": 34.52, + "end": 34.54, + "confidence": 0.185 + }, + { + "text": "better", + "start": 34.54, + "end": 34.56, + "confidence": 0.512 + }, + { + "text": "helmet", + "start": 34.56, + "end": 34.58, + "confidence": 0.699 + }, + { + "text": "that", + "start": 34.58, + "end": 34.6, + "confidence": 0.247 + }, + { + "text": "C1", + "start": 34.6, + "end": 34.92, + "confidence": 0.464 + }, + { + "text": "has.", + "start": 34.92, + "end": 35.3, + "confidence": 0.799 + } + ] + }, + { + "id": 9, + "seek": 3000, + "start": 37.58, + "end": 39.34, + "text": " They got the one mic that makes going through the leak reshapes.", + "tokens": [ + 50714, + 814, + 658, + 264, + 472, + 3123, + 300, + 1669, + 516, + 807, + 264, + 17143, + 725, + 71, + 569, + 279, + 13, + 50814 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.362, + "words": [ + { + "text": "They", + "start": 37.58, + "end": 37.8, + "confidence": 0.355 + }, + { + 
"text": "got", + "start": 37.8, + "end": 37.9, + "confidence": 0.372 + }, + { + "text": "the", + "start": 37.9, + "end": 37.92, + "confidence": 0.702 + }, + { + "text": "one", + "start": 37.92, + "end": 37.94, + "confidence": 0.721 + }, + { + "text": "mic", + "start": 37.94, + "end": 37.96, + "confidence": 0.632 + }, + { + "text": "that", + "start": 37.96, + "end": 37.98, + "confidence": 0.117 + }, + { + "text": "makes", + "start": 37.98, + "end": 38.0, + "confidence": 0.191 + }, + { + "text": "going", + "start": 38.0, + "end": 38.12, + "confidence": 0.749 + }, + { + "text": "through", + "start": 38.12, + "end": 38.34, + "confidence": 0.305 + }, + { + "text": "the", + "start": 38.34, + "end": 38.5, + "confidence": 0.397 + }, + { + "text": "leak", + "start": 38.5, + "end": 38.76, + "confidence": 0.41 + }, + { + "text": "reshapes.", + "start": 38.76, + "end": 39.34, + "confidence": 0.288 + } + ] + }, + { + "id": 10, + "seek": 3000, + "start": 39.9, + "end": 41.94, + "text": " We got them in there helmet bags.", + "tokens": [ + 50864, + 492, + 658, + 552, + 294, + 456, + 15922, + 10405, + 13, + 50964 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.576, + "words": [ + { + "text": "We", + "start": 39.9, + "end": 40.2, + "confidence": 0.487 + }, + { + "text": "got", + "start": 40.2, + "end": 40.48, + "confidence": 0.582 + }, + { + "text": "them", + "start": 40.48, + "end": 40.64, + "confidence": 0.881 + }, + { + "text": "in", + "start": 40.64, + "end": 40.74, + "confidence": 0.917 + }, + { + "text": "there", + "start": 40.74, + "end": 40.96, + "confidence": 0.418 + }, + { + "text": "helmet", + "start": 40.96, + "end": 41.52, + "confidence": 0.654 + }, + { + "text": "bags.", + "start": 41.52, + "end": 41.94, + "confidence": 0.336 + } + ] + }, + { + "id": 11, + "seek": 3000, + "start": 43.02, + "end": 47.4, + "text": " And uh, we got the helmet in there 
helmet bags.", + "tokens": [ + 51014, + 400, + 2232, + 11, + 321, + 658, + 264, + 15922, + 294, + 456, + 15922, + 10405, + 13, + 51264 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.431, + "words": [ + { + "text": "And", + "start": 43.02, + "end": 43.34, + "confidence": 0.575 + }, + { + "text": "uh,", + "start": 43.34, + "end": 43.74, + "confidence": 0.208 + }, + { + "text": "we", + "start": 43.86, + "end": 44.04, + "confidence": 0.423 + }, + { + "text": "got", + "start": 44.04, + "end": 44.2, + "confidence": 0.549 + }, + { + "text": "the", + "start": 44.2, + "end": 44.5, + "confidence": 0.209 + }, + { + "text": "helmet", + "start": 44.5, + "end": 46.46, + "confidence": 0.845 + }, + { + "text": "in", + "start": 46.46, + "end": 46.72, + "confidence": 0.188 + }, + { + "text": "there", + "start": 46.72, + "end": 47.06, + "confidence": 0.391 + }, + { + "text": "helmet", + "start": 47.06, + "end": 47.08, + "confidence": 0.69 + }, + { + "text": "bags.", + "start": 47.08, + "end": 47.4, + "confidence": 0.889 + } + ] + }, + { + "id": 12, + "seek": 3000, + "start": 48.5, + "end": 49.58, + "text": " The leak system, the leak of the bag.", + "tokens": [ + 51314, + 440, + 17143, + 1185, + 11, + 264, + 17143, + 295, + 264, + 3411, + 13, + 51364 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.499, + "words": [ + { + "text": "The", + "start": 48.5, + "end": 48.52, + "confidence": 0.266 + }, + { + "text": "leak", + "start": 48.52, + "end": 48.6, + "confidence": 0.299 + }, + { + "text": "system,", + "start": 48.6, + "end": 48.86, + "confidence": 0.54 + }, + { + "text": "the", + "start": 49.06, + "end": 49.14, + "confidence": 0.589 + }, + { + "text": "leak", + "start": 49.14, + "end": 49.22, + "confidence": 0.962 + }, + { + "text": "of", + "start": 
49.22, + "end": 49.32, + "confidence": 0.244 + }, + { + "text": "the", + "start": 49.32, + "end": 49.4, + "confidence": 0.941 + }, + { + "text": "bag.", + "start": 49.4, + "end": 49.58, + "confidence": 0.689 + } + ] + }, + { + "id": 13, + "seek": 3000, + "start": 51.34, + "end": 51.94, + "text": " Right, yeah.", + "tokens": [ + 51414, + 1779, + 11, + 1338, + 13, + 51464 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.369, + "words": [ + { + "text": "Right,", + "start": 51.34, + "end": 51.72, + "confidence": 0.187 + }, + { + "text": "yeah.", + "start": 51.82, + "end": 51.94, + "confidence": 0.73 + } + ] + }, + { + "id": 14, + "seek": 3000, + "start": 53.06, + "end": 55.22, + "text": " Yeah, we're taking the leak to the auto, see you later.", + "tokens": [ + 51514, + 865, + 11, + 321, + 434, + 1940, + 264, + 17143, + 281, + 264, + 8399, + 11, + 536, + 291, + 1780, + 13, + 51614 + ], + "temperature": 0.2, + "avg_logprob": -0.7122965494791667, + "compression_ratio": 1.8131868131868132, + "no_speech_prob": 0.07163436710834503, + "confidence": 0.425, + "words": [ + { + "text": "Yeah,", + "start": 53.06, + "end": 53.26, + "confidence": 0.561 + }, + { + "text": "we're", + "start": 53.34, + "end": 53.42, + "confidence": 0.725 + }, + { + "text": "taking", + "start": 53.42, + "end": 53.62, + "confidence": 0.683 + }, + { + "text": "the", + "start": 53.62, + "end": 53.8, + "confidence": 0.661 + }, + { + "text": "leak", + "start": 53.8, + "end": 53.88, + "confidence": 0.396 + }, + { + "text": "to", + "start": 53.88, + "end": 54.02, + "confidence": 0.08 + }, + { + "text": "the", + "start": 54.02, + "end": 54.08, + "confidence": 0.935 + }, + { + "text": "auto,", + "start": 54.08, + "end": 54.26, + "confidence": 0.228 + }, + { + "text": "see", + "start": 54.46, + "end": 54.58, + "confidence": 0.191 + }, + { + "text": "you", + "start": 54.58, + "end": 55.14, + 
"confidence": 0.401 + }, + { + "text": "later.", + "start": 55.14, + "end": 55.22, + "confidence": 0.503 + } + ] + }, + { + "id": 15, + "seek": 5500, + "start": 56.4, + "end": 61.48, + "text": " Hey, we were going to hang with the cover on the right side already.", + "tokens": [ + 50414, + 1911, + 11, + 321, + 645, + 516, + 281, + 3967, + 365, + 264, + 2060, + 322, + 264, + 558, + 1252, + 1217, + 13, + 50664 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.371, + "words": [ + { + "text": "Hey,", + "start": 56.4, + "end": 56.6, + "confidence": 0.195 + }, + { + "text": "we", + "start": 56.62, + "end": 56.74, + "confidence": 0.949 + }, + { + "text": "were", + "start": 56.74, + "end": 56.9, + "confidence": 0.526 + }, + { + "text": "going", + "start": 56.9, + "end": 57.1, + "confidence": 0.184 + }, + { + "text": "to", + "start": 57.1, + "end": 57.22, + "confidence": 0.938 + }, + { + "text": "hang", + "start": 57.22, + "end": 57.38, + "confidence": 0.255 + }, + { + "text": "with", + "start": 57.38, + "end": 59.24, + "confidence": 0.252 + }, + { + "text": "the", + "start": 59.24, + "end": 60.24, + "confidence": 0.529 + }, + { + "text": "cover", + "start": 60.24, + "end": 61.02, + "confidence": 0.737 + }, + { + "text": "on", + "start": 61.02, + "end": 61.22, + "confidence": 0.324 + }, + { + "text": "the", + "start": 61.22, + "end": 61.28, + "confidence": 0.44 + }, + { + "text": "right", + "start": 61.28, + "end": 61.3, + "confidence": 0.088 + }, + { + "text": "side", + "start": 61.3, + "end": 61.4, + "confidence": 0.4 + }, + { + "text": "already.", + "start": 61.4, + "end": 61.48, + "confidence": 0.447 + } + ] + }, + { + "id": 16, + "seek": 5500, + "start": 62.52, + "end": 63.02, + "text": " Okay, fine.", + "tokens": [ + 50714, + 1033, + 11, + 2489, + 13, + 50764 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 
1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.91, + "words": [ + { + "text": "Okay,", + "start": 62.52, + "end": 62.78, + "confidence": 0.914 + }, + { + "text": "fine.", + "start": 62.88, + "end": 63.02, + "confidence": 0.905 + } + ] + }, + { + "id": 17, + "seek": 5500, + "start": 63.02, + "end": 65.1, + "text": " We weren't sure of that, just a suggestion.", + "tokens": [ + 50764, + 492, + 4999, + 380, + 988, + 295, + 300, + 11, + 445, + 257, + 16541, + 13, + 50864 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.842, + "words": [ + { + "text": "We", + "start": 63.02, + "end": 63.3, + "confidence": 0.937 + }, + { + "text": "weren't", + "start": 63.3, + "end": 63.56, + "confidence": 0.976 + }, + { + "text": "sure", + "start": 63.56, + "end": 63.72, + "confidence": 0.929 + }, + { + "text": "of", + "start": 63.72, + "end": 63.84, + "confidence": 0.502 + }, + { + "text": "that,", + "start": 63.84, + "end": 63.98, + "confidence": 0.986 + }, + { + "text": "just", + "start": 64.12, + "end": 64.56, + "confidence": 0.772 + }, + { + "text": "a", + "start": 64.56, + "end": 64.72, + "confidence": 0.675 + }, + { + "text": "suggestion.", + "start": 64.72, + "end": 65.1, + "confidence": 0.994 + } + ] + }, + { + "id": 18, + "seek": 5500, + "start": 65.2, + "end": 67.5, + "text": " We thought we'd, uh, you could check it out.", + "tokens": [ + 50864, + 492, + 1194, + 321, + 1116, + 11, + 2232, + 11, + 291, + 727, + 1520, + 309, + 484, + 13, + 50964 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.754, + "words": [ + { + "text": "We", + "start": 65.2, + "end": 65.4, + "confidence": 0.915 + }, + { + "text": "thought", + "start": 65.4, + "end": 65.54, + "confidence": 0.972 + }, + { + "text": "we'd,", + "start": 65.54, + 
"end": 65.9, + "confidence": 0.679 + }, + { + "text": "uh,", + "start": 65.96, + "end": 66.02, + "confidence": 0.597 + }, + { + "text": "you", + "start": 66.78, + "end": 67.04, + "confidence": 0.408 + }, + { + "text": "could", + "start": 67.04, + "end": 67.2, + "confidence": 0.808 + }, + { + "text": "check", + "start": 67.2, + "end": 67.36, + "confidence": 0.751 + }, + { + "text": "it", + "start": 67.36, + "end": 67.48, + "confidence": 0.984 + }, + { + "text": "out.", + "start": 67.48, + "end": 67.5, + "confidence": 0.998 + } + ] + }, + { + "id": 19, + "seek": 5500, + "start": 68.2, + "end": 72.4, + "text": " It's not much of a hard to turn on, so uh, I guess we're going to come up with just let us know.", + "tokens": [ + 51014, + 467, + 311, + 406, + 709, + 295, + 257, + 1152, + 281, + 1261, + 322, + 11, + 370, + 2232, + 11, + 286, + 2041, + 321, + 434, + 516, + 281, + 808, + 493, + 365, + 445, + 718, + 505, + 458, + 13, + 51214 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.608, + "words": [ + { + "text": "It's", + "start": 68.2, + "end": 68.3, + "confidence": 0.411 + }, + { + "text": "not", + "start": 68.3, + "end": 68.4, + "confidence": 0.946 + }, + { + "text": "much", + "start": 68.4, + "end": 68.56, + "confidence": 0.902 + }, + { + "text": "of", + "start": 68.56, + "end": 68.7, + "confidence": 0.574 + }, + { + "text": "a", + "start": 68.7, + "end": 68.72, + "confidence": 0.719 + }, + { + "text": "hard", + "start": 68.72, + "end": 68.84, + "confidence": 0.144 + }, + { + "text": "to", + "start": 68.84, + "end": 68.98, + "confidence": 0.405 + }, + { + "text": "turn", + "start": 68.98, + "end": 69.1, + "confidence": 0.673 + }, + { + "text": "on,", + "start": 69.1, + "end": 69.22, + "confidence": 0.157 + }, + { + "text": "so", + "start": 69.26, + "end": 69.56, + "confidence": 0.845 + }, + { + "text": "uh,", + "start": 69.56, + "end": 69.84, + 
"confidence": 0.31 + }, + { + "text": "I", + "start": 70.34, + "end": 70.5, + "confidence": 0.786 + }, + { + "text": "guess", + "start": 70.5, + "end": 70.64, + "confidence": 0.993 + }, + { + "text": "we're", + "start": 70.64, + "end": 71.08, + "confidence": 0.562 + }, + { + "text": "going", + "start": 71.08, + "end": 71.2, + "confidence": 0.781 + }, + { + "text": "to", + "start": 71.2, + "end": 71.28, + "confidence": 0.991 + }, + { + "text": "come", + "start": 71.28, + "end": 71.42, + "confidence": 0.964 + }, + { + "text": "up", + "start": 71.42, + "end": 71.6, + "confidence": 0.952 + }, + { + "text": "with", + "start": 71.6, + "end": 71.76, + "confidence": 0.954 + }, + { + "text": "just", + "start": 71.76, + "end": 71.94, + "confidence": 0.316 + }, + { + "text": "let", + "start": 71.94, + "end": 72.1, + "confidence": 0.811 + }, + { + "text": "us", + "start": 72.1, + "end": 72.24, + "confidence": 0.977 + }, + { + "text": "know.", + "start": 72.24, + "end": 72.4, + "confidence": 0.997 + } + ] + }, + { + "id": 20, + "seek": 5500, + "start": 74.22, + "end": 75.03, + "text": " Okay, no problem.", + "tokens": [ + 51314, + 1033, + 11, + 572, + 1154, + 13, + 51364 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.912, + "words": [ + { + "text": "Okay,", + "start": 74.22, + "end": 74.48, + "confidence": 0.833 + }, + { + "text": "no", + "start": 74.62, + "end": 74.84, + "confidence": 0.935 + }, + { + "text": "problem.", + "start": 74.84, + "end": 75.03, + "confidence": 0.974 + } + ] + }, + { + "id": 21, + "seek": 5500, + "start": 75.03, + "end": 76.48, + "text": " Okay, no problem.", + "tokens": [ + 51364, + 1033, + 11, + 572, + 1154, + 13, + 51414 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.839, + "words": [ + { + "text": "Okay,", + 
"start": 75.03, + "end": 75.78, + "confidence": 0.629 + }, + { + "text": "no", + "start": 75.94, + "end": 76.14, + "confidence": 0.946 + }, + { + "text": "problem.", + "start": 76.14, + "end": 76.48, + "confidence": 0.991 + } + ] + }, + { + "id": 22, + "seek": 5500, + "start": 76.48, + "end": 78.22, + "text": " We'll let you know when the end of the sun.", + "tokens": [ + 51414, + 492, + 603, + 718, + 291, + 458, + 562, + 264, + 917, + 295, + 264, + 3295, + 13, + 51514 + ], + "temperature": 0.2, + "avg_logprob": -0.4537031500189154, + "compression_ratio": 1.6168224299065421, + "no_speech_prob": 0.3397921025753021, + "confidence": 0.607, + "words": [ + { + "text": "We'll", + "start": 76.48, + "end": 76.8, + "confidence": 0.667 + }, + { + "text": "let", + "start": 76.8, + "end": 76.92, + "confidence": 0.949 + }, + { + "text": "you", + "start": 76.92, + "end": 77.08, + "confidence": 0.544 + }, + { + "text": "know", + "start": 77.08, + "end": 77.18, + "confidence": 0.998 + }, + { + "text": "when", + "start": 77.18, + "end": 77.3, + "confidence": 0.533 + }, + { + "text": "the", + "start": 77.3, + "end": 77.4, + "confidence": 0.894 + }, + { + "text": "end", + "start": 77.4, + "end": 77.52, + "confidence": 0.97 + }, + { + "text": "of", + "start": 77.52, + "end": 77.64, + "confidence": 0.976 + }, + { + "text": "the", + "start": 77.64, + "end": 78.02, + "confidence": 0.527 + }, + { + "text": "sun.", + "start": 78.02, + "end": 78.22, + "confidence": 0.075 + } + ] + }, + { + "id": 23, + "seek": 8500, + "start": 85.22, + "end": 85.4, + "text": " Hello.", + "tokens": [ + 50364, + 2425, + 13, + 50414 + ], + "temperature": 0.2, + "avg_logprob": -0.6903002738952637, + "compression_ratio": 0.42857142857142855, + "no_speech_prob": 0.9557693600654602, + "confidence": 0.216, + "words": [ + { + "text": "Hello.", + "start": 85.22, + "end": 85.4, + "confidence": 0.216 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git 
a/tests/expected/corner_cases/stucked_lm_apollo11.mp3.words.json b/tests/expected/corner_cases/stucked_lm_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..ab5aefe27e14ec694737a5182311b067430f6cde --- /dev/null +++ b/tests/expected/corner_cases/stucked_lm_apollo11.mp3.words.json @@ -0,0 +1,3820 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA. Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1. And you can put the other one on the mic helmet with those GVA blizzard frames. Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got 
them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.52, + "end": 6.54, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA.", + "tokens": [ + 50364, + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 20914, + 460, + 2634, + 15454, + 460, + 20914, + 13, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.7225757398103413, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.541, + "words": [ + { + "text": "Apollo", + "start": 0.52, + "end": 0.88, + "confidence": 0.155 + }, + { + "text": "11,", + "start": 0.88, + "end": 1.26, + "confidence": 0.977 + }, + { + "text": "Houston", + "start": 1.52, + "end": 1.72, + "confidence": 0.986 + }, + { + "text": "we", + "start": 1.72, + "end": 1.94, + "confidence": 0.518 + }, + { + "text": "got", + "start": 1.94, + "end": 2.1, + "confidence": 0.823 + }, + { + "text": "a", + "start": 2.1, + "end": 2.26, + "confidence": 0.989 + }, + { + "text": "recommendation", + "start": 2.26, + "end": 2.86, + "confidence": 0.968 + }, + { + "text": "for", + 
"start": 2.86, + "end": 3.44, + "confidence": 0.946 + }, + { + "text": "you", + "start": 3.44, + "end": 3.6, + "confidence": 0.984 + }, + { + "text": "on", + "start": 3.6, + "end": 3.72, + "confidence": 0.909 + }, + { + "text": "your", + "start": 3.72, + "end": 3.92, + "confidence": 0.971 + }, + { + "text": "Soyuz-VA", + "start": 3.92, + "end": 5.16, + "confidence": 0.26 + }, + { + "text": "GLEME", + "start": 5.16, + "end": 5.74, + "confidence": 0.475 + }, + { + "text": "GVA.", + "start": 5.74, + "end": 6.54, + "confidence": 0.435 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.8, + "end": 19.06, + "text": " Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1.", + "tokens": [ + 50714, + 2798, + 11, + 1392, + 11, + 321, + 411, + 281, + 584, + 300, + 436, + 652, + 264, + 472, + 300, + 311, + 322, + 264, + 15922, + 321, + 434, + 516, + 281, + 362, + 294, + 363, + 16, + 13, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.7225757398103413, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.468, + "words": [ + { + "text": "Alright,", + "start": 10.8, + "end": 11.04, + "confidence": 0.31 + }, + { + "text": "okay,", + "start": 11.68, + "end": 12.22, + "confidence": 0.504 + }, + { + "text": "we", + "start": 12.52, + "end": 12.96, + "confidence": 0.609 + }, + { + "text": "like", + "start": 12.96, + "end": 13.28, + "confidence": 0.505 + }, + { + "text": "to", + "start": 13.28, + "end": 13.54, + "confidence": 0.263 + }, + { + "text": "say", + "start": 13.54, + "end": 14.9, + "confidence": 0.138 + }, + { + "text": "that", + "start": 14.9, + "end": 15.38, + "confidence": 0.199 + }, + { + "text": "they", + "start": 15.38, + "end": 15.44, + "confidence": 0.417 + }, + { + "text": "make", + "start": 15.44, + "end": 15.68, + "confidence": 0.402 + }, + { + "text": "the", + "start": 15.68, + "end": 15.84, + "confidence": 0.253 + }, + { + "text": "one", + "start": 15.84, + 
"end": 16.06, + "confidence": 0.609 + }, + { + "text": "that's", + "start": 16.06, + "end": 16.28, + "confidence": 0.442 + }, + { + "text": "on", + "start": 16.28, + "end": 16.48, + "confidence": 0.595 + }, + { + "text": "the", + "start": 16.48, + "end": 16.78, + "confidence": 0.872 + }, + { + "text": "helmet", + "start": 16.78, + "end": 17.26, + "confidence": 0.856 + }, + { + "text": "we're", + "start": 17.26, + "end": 17.76, + "confidence": 0.299 + }, + { + "text": "going", + "start": 17.76, + "end": 17.92, + "confidence": 0.598 + }, + { + "text": "to", + "start": 17.92, + "end": 18.06, + "confidence": 0.822 + }, + { + "text": "have", + "start": 18.06, + "end": 18.2, + "confidence": 0.835 + }, + { + "text": "in", + "start": 18.2, + "end": 18.36, + "confidence": 0.717 + }, + { + "text": "B1.", + "start": 18.36, + "end": 19.06, + "confidence": 0.764 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 19.36, + "end": 24.52, + "text": " And you can put the other one on the mic helmet with those GVA blizzard frames.", + "tokens": [ + 51314, + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 888, + 31062, + 12083, + 13, + 51614 + ], + "temperature": 0.0, + "avg_logprob": -0.7225757398103413, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.485, + "words": [ + { + "text": "And", + "start": 19.36, + "end": 20.2, + "confidence": 0.668 + }, + { + "text": "you", + "start": 20.2, + "end": 20.32, + "confidence": 0.948 + }, + { + "text": "can", + "start": 20.32, + "end": 20.48, + "confidence": 0.725 + }, + { + "text": "put", + "start": 20.48, + "end": 20.64, + "confidence": 0.98 + }, + { + "text": "the", + "start": 20.64, + "end": 20.84, + "confidence": 0.989 + }, + { + "text": "other", + "start": 20.84, + "end": 21.0, + "confidence": 0.991 + }, + { + "text": "one", + "start": 21.0, + "end": 21.18, + "confidence": 0.978 + }, + { + "text": "on", + "start": 21.18, + 
"end": 21.4, + "confidence": 0.989 + }, + { + "text": "the", + "start": 21.4, + "end": 21.94, + "confidence": 0.522 + }, + { + "text": "mic", + "start": 21.94, + "end": 22.48, + "confidence": 0.414 + }, + { + "text": "helmet", + "start": 22.48, + "end": 22.8, + "confidence": 0.882 + }, + { + "text": "with", + "start": 22.8, + "end": 23.06, + "confidence": 0.423 + }, + { + "text": "those", + "start": 23.06, + "end": 23.3, + "confidence": 0.466 + }, + { + "text": "GVA", + "start": 23.3, + "end": 23.74, + "confidence": 0.214 + }, + { + "text": "blizzard", + "start": 23.74, + "end": 24.18, + "confidence": 0.108 + }, + { + "text": "frames.", + "start": 24.18, + "end": 24.52, + "confidence": 0.255 + } + ] + }, + { + "id": 3, + "seek": 2500, + "start": 31.34, + "end": 54.98, + "text": " Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 2798, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 
658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.11148937649197048, + "compression_ratio": 24.096774193548388, + "no_speech_prob": 0.4302051365375519, + "confidence": 0.93, + "words": [ + { + "text": "Alright,", + "start": 31.34, + "end": 31.52, + "confidence": 0.066 + }, + { + "text": "got", + "start": 31.82, + "end": 31.84, + "confidence": 0.335 + }, + { + "text": "them,", + "start": 31.84, + "end": 32.12, + "confidence": 0.274 + }, + { + "text": "got", + "start": 32.38, + "end": 32.9, + "confidence": 0.568 + }, + { + "text": "them,", + "start": 32.9, + "end": 33.46, + "confidence": 0.941 + }, + { + "text": "got", + "start": 33.74, + "end": 33.76, + "confidence": 0.581 + }, + { + "text": "them,", + "start": 33.76, + "end": 33.78, + "confidence": 0.925 + }, + { + "text": "got", + "start": 33.78, + "end": 33.8, + "confidence": 0.523 + }, + { + "text": "them,", + "start": 33.8, + "end": 33.9, + "confidence": 0.906 + }, + { + "text": 
"got", + "start": 34.12, + "end": 34.14, + "confidence": 0.635 + }, + { + "text": "them,", + "start": 34.14, + "end": 34.5, + "confidence": 0.92 + }, + { + "text": "got", + "start": 34.5, + "end": 34.6, + "confidence": 0.688 + }, + { + "text": "them,", + "start": 34.6, + "end": 34.62, + "confidence": 0.946 + }, + { + "text": "got", + "start": 34.62, + "end": 34.64, + "confidence": 0.771 + }, + { + "text": "them,", + "start": 34.64, + "end": 34.66, + "confidence": 0.967 + }, + { + "text": "got", + "start": 34.66, + "end": 34.68, + "confidence": 0.856 + }, + { + "text": "them,", + "start": 34.68, + "end": 34.7, + "confidence": 0.975 + }, + { + "text": "got", + "start": 34.82, + "end": 34.92, + "confidence": 0.868 + }, + { + "text": "them,", + "start": 34.92, + "end": 34.94, + "confidence": 0.981 + }, + { + "text": "got", + "start": 34.94, + "end": 34.96, + "confidence": 0.909 + }, + { + "text": "them,", + "start": 34.96, + "end": 35.1, + "confidence": 0.985 + }, + { + "text": "got", + "start": 35.1, + "end": 35.28, + "confidence": 0.931 + }, + { + "text": "them,", + "start": 35.28, + "end": 35.62, + "confidence": 0.988 + }, + { + "text": "got", + "start": 35.74, + "end": 35.76, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 35.76, + "end": 35.78, + "confidence": 0.988 + }, + { + "text": "got", + "start": 36.0, + "end": 36.02, + "confidence": 0.948 + }, + { + "text": "them,", + "start": 36.02, + "end": 36.04, + "confidence": 0.988 + }, + { + "text": "got", + "start": 36.04, + "end": 36.06, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 36.06, + "end": 36.08, + "confidence": 0.99 + }, + { + "text": "got", + "start": 36.08, + "end": 36.1, + "confidence": 0.948 + }, + { + "text": "them,", + "start": 36.1, + "end": 36.12, + "confidence": 0.991 + }, + { + "text": "got", + "start": 36.12, + "end": 36.14, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 36.14, + "end": 36.16, + "confidence": 0.992 + }, + { + "text": "got", + "start": 
36.16, + "end": 36.34, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 36.34, + "end": 36.74, + "confidence": 0.992 + }, + { + "text": "got", + "start": 36.74, + "end": 37.46, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 37.46, + "end": 37.82, + "confidence": 0.991 + }, + { + "text": "got", + "start": 37.82, + "end": 37.84, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 37.84, + "end": 38.12, + "confidence": 0.992 + }, + { + "text": "got", + "start": 38.12, + "end": 38.14, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 38.14, + "end": 38.5, + "confidence": 0.992 + }, + { + "text": "got", + "start": 38.5, + "end": 38.52, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 38.52, + "end": 38.54, + "confidence": 0.992 + }, + { + "text": "got", + "start": 38.54, + "end": 38.56, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 38.56, + "end": 38.58, + "confidence": 0.992 + }, + { + "text": "got", + "start": 38.58, + "end": 38.6, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 38.6, + "end": 38.62, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.62, + "end": 38.64, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 38.64, + "end": 38.66, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.66, + "end": 38.68, + "confidence": 0.962 + }, + { + "text": "them,", + "start": 38.68, + "end": 38.7, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.7, + "end": 38.72, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 38.72, + "end": 38.74, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.74, + "end": 38.76, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 38.76, + "end": 38.78, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.78, + "end": 38.8, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 38.8, + "end": 38.82, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.82, + "end": 
38.84, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 38.84, + "end": 38.86, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.86, + "end": 38.88, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 38.88, + "end": 38.9, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.9, + "end": 38.92, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 38.92, + "end": 38.94, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.94, + "end": 38.96, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 38.96, + "end": 38.98, + "confidence": 0.993 + }, + { + "text": "got", + "start": 38.98, + "end": 39.0, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 39.0, + "end": 39.02, + "confidence": 0.993 + }, + { + "text": "got", + "start": 39.02, + "end": 39.04, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 39.04, + "end": 39.06, + "confidence": 0.993 + }, + { + "text": "got", + "start": 39.06, + "end": 39.08, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 39.08, + "end": 39.1, + "confidence": 0.994 + }, + { + "text": "got", + "start": 39.1, + "end": 39.12, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 39.12, + "end": 39.14, + "confidence": 0.994 + }, + { + "text": "got", + "start": 39.14, + "end": 39.16, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 39.16, + "end": 39.18, + "confidence": 0.994 + }, + { + "text": "got", + "start": 39.18, + "end": 39.2, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 39.2, + "end": 39.22, + "confidence": 0.994 + }, + { + "text": "got", + "start": 39.22, + "end": 39.24, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 39.24, + "end": 39.26, + "confidence": 0.994 + }, + { + "text": "got", + "start": 39.26, + "end": 39.28, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 39.28, + "end": 39.3, + "confidence": 0.994 + }, + { + "text": "got", + "start": 39.3, + "end": 39.32, + 
"confidence": 0.977 + }, + { + "text": "them,", + "start": 39.32, + "end": 39.34, + "confidence": 0.994 + }, + { + "text": "got", + "start": 39.34, + "end": 39.36, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 39.36, + "end": 39.38, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.38, + "end": 39.4, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 39.4, + "end": 39.42, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.42, + "end": 39.44, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 39.44, + "end": 39.46, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.46, + "end": 39.48, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 39.48, + "end": 39.5, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.5, + "end": 39.52, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 39.52, + "end": 39.54, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.54, + "end": 39.56, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 39.56, + "end": 39.58, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.58, + "end": 39.6, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 39.6, + "end": 39.62, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.62, + "end": 39.64, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 39.64, + "end": 39.66, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.66, + "end": 39.68, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 39.68, + "end": 39.7, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.7, + "end": 39.72, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 39.72, + "end": 39.74, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.74, + "end": 39.76, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 39.76, + "end": 39.78, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.78, + "end": 39.8, + "confidence": 
0.989 + }, + { + "text": "them,", + "start": 39.8, + "end": 39.82, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.82, + "end": 39.84, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.84, + "end": 39.86, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.86, + "end": 39.88, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.88, + "end": 39.9, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.9, + "end": 39.92, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.92, + "end": 39.94, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.94, + "end": 39.96, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.96, + "end": 39.98, + "confidence": 0.995 + }, + { + "text": "got", + "start": 39.98, + "end": 40.0, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 40.0, + "end": 40.02, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.02, + "end": 40.04, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.04, + "end": 40.06, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.06, + "end": 40.08, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.08, + "end": 40.1, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.1, + "end": 40.12, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.12, + "end": 40.14, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.14, + "end": 40.16, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.16, + "end": 40.18, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.18, + "end": 40.2, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.2, + "end": 40.22, + "confidence": 0.995 + }, + { + "text": "got", + "start": 40.22, + "end": 40.46, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.46, + "end": 40.76, + "confidence": 0.996 + }, + { + "text": "got", + "start": 41.02, + "end": 41.04, + "confidence": 0.993 + }, + { + 
"text": "them,", + "start": 41.04, + "end": 41.72, + "confidence": 0.996 + }, + { + "text": "got", + "start": 41.9, + "end": 41.92, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 41.92, + "end": 43.0, + "confidence": 0.996 + }, + { + "text": "got", + "start": 43.0, + "end": 44.06, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 44.06, + "end": 44.88, + "confidence": 0.996 + }, + { + "text": "got", + "start": 44.94, + "end": 45.46, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 45.46, + "end": 45.76, + "confidence": 0.996 + }, + { + "text": "got", + "start": 45.76, + "end": 47.06, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 47.06, + "end": 47.76, + "confidence": 0.996 + }, + { + "text": "got", + "start": 47.82, + "end": 48.5, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 48.5, + "end": 48.9, + "confidence": 0.996 + }, + { + "text": "got", + "start": 48.9, + "end": 49.2, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 49.2, + "end": 50.8, + "confidence": 0.996 + }, + { + "text": "got", + "start": 51.18, + "end": 51.74, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 51.74, + "end": 52.38, + "confidence": 0.997 + }, + { + "text": "got", + "start": 52.44, + "end": 53.26, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 53.26, + "end": 53.74, + "confidence": 0.997 + }, + { + "text": "got", + "start": 53.76, + "end": 54.2, + "confidence": 0.995 + }, + { + "text": "them", + "start": 54.2, + "end": 54.98, + "confidence": 0.997 + } + ] + }, + { + "id": 4, + "seek": 5500, + "start": 55.0, + "end": 85.0, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got 
them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.05314932168866487, + "compression_ratio": 29.52, + "no_speech_prob": 
0.2454655021429062, + "confidence": 0.948, + "words": [ + { + "text": "got", + "start": 55.0, + "end": 55.1, + "confidence": 0.213 + }, + { + "text": "them,", + "start": 55.1, + "end": 55.12, + "confidence": 0.95 + }, + { + "text": "got", + "start": 55.16, + "end": 55.18, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 55.18, + "end": 55.5, + "confidence": 0.997 + }, + { + "text": "got", + "start": 55.56, + "end": 57.36, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 57.36, + "end": 57.52, + "confidence": 0.997 + }, + { + "text": "got", + "start": 57.58, + "end": 57.68, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 57.68, + "end": 57.7, + "confidence": 0.997 + }, + { + "text": "got", + "start": 57.7, + "end": 57.72, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 57.72, + "end": 57.74, + "confidence": 0.993 + }, + { + "text": "got", + "start": 57.74, + "end": 57.76, + "confidence": 0.912 + }, + { + "text": "them,", + "start": 57.76, + "end": 57.78, + "confidence": 0.988 + }, + { + "text": "got", + "start": 57.78, + "end": 57.8, + "confidence": 0.872 + }, + { + "text": "them,", + "start": 57.8, + "end": 57.82, + "confidence": 0.982 + }, + { + "text": "got", + "start": 57.82, + "end": 57.84, + "confidence": 0.862 + }, + { + "text": "them,", + "start": 57.84, + "end": 57.86, + "confidence": 0.984 + }, + { + "text": "got", + "start": 57.86, + "end": 57.88, + "confidence": 0.888 + }, + { + "text": "them,", + "start": 57.88, + "end": 57.9, + "confidence": 0.983 + }, + { + "text": "got", + "start": 57.9, + "end": 58.98, + "confidence": 0.85 + }, + { + "text": "them,", + "start": 58.98, + "end": 59.22, + "confidence": 0.924 + }, + { + "text": "got", + "start": 60.5, + "end": 61.26, + "confidence": 0.56 + }, + { + "text": "them,", + "start": 61.26, + "end": 61.94, + "confidence": 0.958 + }, + { + "text": "got", + "start": 61.94, + "end": 61.96, + "confidence": 0.81 + }, + { + "text": "them,", + "start": 61.96, + "end": 
61.98, + "confidence": 0.976 + }, + { + "text": "got", + "start": 61.98, + "end": 62.0, + "confidence": 0.842 + }, + { + "text": "them,", + "start": 62.0, + "end": 62.02, + "confidence": 0.977 + }, + { + "text": "got", + "start": 62.02, + "end": 62.04, + "confidence": 0.835 + }, + { + "text": "them,", + "start": 62.04, + "end": 62.06, + "confidence": 0.977 + }, + { + "text": "got", + "start": 62.06, + "end": 62.08, + "confidence": 0.835 + }, + { + "text": "them,", + "start": 62.08, + "end": 62.1, + "confidence": 0.979 + }, + { + "text": "got", + "start": 62.1, + "end": 62.12, + "confidence": 0.853 + }, + { + "text": "them,", + "start": 62.12, + "end": 62.14, + "confidence": 0.983 + }, + { + "text": "got", + "start": 62.14, + "end": 62.16, + "confidence": 0.875 + }, + { + "text": "them,", + "start": 62.16, + "end": 62.18, + "confidence": 0.986 + }, + { + "text": "got", + "start": 62.18, + "end": 62.2, + "confidence": 0.892 + }, + { + "text": "them,", + "start": 62.2, + "end": 62.22, + "confidence": 0.985 + }, + { + "text": "got", + "start": 62.22, + "end": 62.24, + "confidence": 0.884 + }, + { + "text": "them,", + "start": 62.24, + "end": 62.26, + "confidence": 0.985 + }, + { + "text": "got", + "start": 62.26, + "end": 62.28, + "confidence": 0.877 + }, + { + "text": "them,", + "start": 62.28, + "end": 62.3, + "confidence": 0.986 + }, + { + "text": "got", + "start": 62.3, + "end": 62.32, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 62.32, + "end": 62.34, + "confidence": 0.987 + }, + { + "text": "got", + "start": 62.34, + "end": 62.36, + "confidence": 0.871 + }, + { + "text": "them,", + "start": 62.36, + "end": 62.38, + "confidence": 0.987 + }, + { + "text": "got", + "start": 62.38, + "end": 62.4, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 62.4, + "end": 62.42, + "confidence": 0.988 + }, + { + "text": "got", + "start": 62.44, + "end": 62.46, + "confidence": 0.883 + }, + { + "text": "them,", + "start": 62.46, + "end": 62.48, + 
"confidence": 0.989 + }, + { + "text": "got", + "start": 62.54, + "end": 62.78, + "confidence": 0.889 + }, + { + "text": "them,", + "start": 62.78, + "end": 62.8, + "confidence": 0.989 + }, + { + "text": "got", + "start": 62.8, + "end": 62.82, + "confidence": 0.894 + }, + { + "text": "them,", + "start": 62.82, + "end": 62.84, + "confidence": 0.99 + }, + { + "text": "got", + "start": 62.84, + "end": 62.86, + "confidence": 0.902 + }, + { + "text": "them,", + "start": 62.86, + "end": 62.88, + "confidence": 0.99 + }, + { + "text": "got", + "start": 62.88, + "end": 62.9, + "confidence": 0.904 + }, + { + "text": "them,", + "start": 62.9, + "end": 62.92, + "confidence": 0.99 + }, + { + "text": "got", + "start": 62.92, + "end": 62.94, + "confidence": 0.91 + }, + { + "text": "them,", + "start": 62.94, + "end": 62.96, + "confidence": 0.991 + }, + { + "text": "got", + "start": 62.96, + "end": 62.98, + "confidence": 0.916 + }, + { + "text": "them,", + "start": 62.98, + "end": 63.0, + "confidence": 0.991 + }, + { + "text": "got", + "start": 63.0, + "end": 63.02, + "confidence": 0.918 + }, + { + "text": "them,", + "start": 63.02, + "end": 63.04, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.04, + "end": 63.06, + "confidence": 0.923 + }, + { + "text": "them,", + "start": 63.06, + "end": 63.08, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.08, + "end": 63.1, + "confidence": 0.93 + }, + { + "text": "them,", + "start": 63.1, + "end": 63.12, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.12, + "end": 63.14, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 63.14, + "end": 63.16, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.16, + "end": 63.18, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 63.18, + "end": 63.2, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.2, + "end": 63.22, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 63.22, + "end": 63.24, + "confidence": 0.992 + 
}, + { + "text": "got", + "start": 63.24, + "end": 63.26, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 63.26, + "end": 63.28, + "confidence": 0.993 + }, + { + "text": "got", + "start": 63.28, + "end": 63.3, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 63.3, + "end": 63.32, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.32, + "end": 63.34, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 63.34, + "end": 63.36, + "confidence": 0.993 + }, + { + "text": "got", + "start": 63.36, + "end": 63.38, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 63.38, + "end": 63.4, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.4, + "end": 63.46, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 63.46, + "end": 63.64, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.64, + "end": 63.68, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 63.68, + "end": 63.7, + "confidence": 0.993 + }, + { + "text": "got", + "start": 63.7, + "end": 63.72, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 63.72, + "end": 63.74, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.74, + "end": 63.76, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 63.76, + "end": 63.78, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.78, + "end": 63.8, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 63.8, + "end": 63.82, + "confidence": 0.992 + }, + { + "text": "got", + "start": 63.82, + "end": 63.84, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 63.84, + "end": 64.42, + "confidence": 0.992 + }, + { + "text": "got", + "start": 64.46, + "end": 64.58, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 64.58, + "end": 64.64, + "confidence": 0.993 + }, + { + "text": "got", + "start": 64.72, + "end": 65.06, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 65.06, + "end": 65.22, + "confidence": 0.992 + }, + { + "text": 
"got", + "start": 65.22, + "end": 66.0, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 66.0, + "end": 66.2, + "confidence": 0.992 + }, + { + "text": "got", + "start": 66.38, + "end": 67.34, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 67.34, + "end": 67.44, + "confidence": 0.992 + }, + { + "text": "got", + "start": 67.48, + "end": 67.5, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 67.5, + "end": 67.52, + "confidence": 0.993 + }, + { + "text": "got", + "start": 67.52, + "end": 67.54, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 67.54, + "end": 67.56, + "confidence": 0.992 + }, + { + "text": "got", + "start": 67.56, + "end": 67.58, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 67.58, + "end": 67.6, + "confidence": 0.992 + }, + { + "text": "got", + "start": 67.6, + "end": 67.62, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 67.62, + "end": 67.64, + "confidence": 0.992 + }, + { + "text": "got", + "start": 67.68, + "end": 67.7, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 67.7, + "end": 67.72, + "confidence": 0.992 + }, + { + "text": "got", + "start": 67.72, + "end": 67.74, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 67.74, + "end": 67.86, + "confidence": 0.992 + }, + { + "text": "got", + "start": 68.12, + "end": 68.36, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 68.36, + "end": 68.38, + "confidence": 0.992 + }, + { + "text": "got", + "start": 68.56, + "end": 68.58, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 68.58, + "end": 68.6, + "confidence": 0.992 + }, + { + "text": "got", + "start": 68.6, + "end": 68.8, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 68.8, + "end": 69.12, + "confidence": 0.992 + }, + { + "text": "got", + "start": 69.26, + "end": 69.28, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 69.28, + "end": 69.44, + "confidence": 0.992 + }, + { + "text": "got", + "start": 
69.84, + "end": 69.86, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 69.86, + "end": 70.02, + "confidence": 0.992 + }, + { + "text": "got", + "start": 70.2, + "end": 70.5, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 70.5, + "end": 71.42, + "confidence": 0.993 + }, + { + "text": "got", + "start": 71.56, + "end": 71.58, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 71.58, + "end": 71.94, + "confidence": 0.993 + }, + { + "text": "got", + "start": 71.94, + "end": 72.1, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 72.1, + "end": 72.82, + "confidence": 0.993 + }, + { + "text": "got", + "start": 72.82, + "end": 74.48, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 74.48, + "end": 74.66, + "confidence": 0.993 + }, + { + "text": "got", + "start": 74.74, + "end": 74.88, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 74.88, + "end": 74.9, + "confidence": 0.993 + }, + { + "text": "got", + "start": 74.92, + "end": 74.94, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 74.94, + "end": 74.96, + "confidence": 0.993 + }, + { + "text": "got", + "start": 75.12, + "end": 75.14, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 75.14, + "end": 75.24, + "confidence": 0.993 + }, + { + "text": "got", + "start": 75.24, + "end": 75.78, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 75.78, + "end": 76.02, + "confidence": 0.993 + }, + { + "text": "got", + "start": 76.02, + "end": 76.4, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 76.4, + "end": 76.6, + "confidence": 0.993 + }, + { + "text": "got", + "start": 76.6, + "end": 76.82, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 76.82, + "end": 77.76, + "confidence": 0.993 + }, + { + "text": "got", + "start": 78.22, + "end": 78.24, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 78.24, + "end": 78.42, + "confidence": 0.993 + }, + { + "text": "got", + "start": 80.0, + "end": 
80.02, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 80.02, + "end": 82.6, + "confidence": 0.993 + }, + { + "text": "got", + "start": 82.6, + "end": 84.98, + "confidence": 0.98 + }, + { + "text": "them", + "start": 84.98, + "end": 85.0, + "confidence": 0.994 + } + ] + }, + { + "id": 5, + "seek": 8500, + "start": 85.0, + "end": 115.0, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, 
+ 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.042715128227199674, + "compression_ratio": 29.52, + "no_speech_prob": 0.6358686685562134, + "confidence": 0.953, + "words": [ + { + "text": "got", + "start": 85.0, + "end": 85.4, + "confidence": 0.455 + }, + { + "text": "them,", + "start": 85.4, + "end": 85.58, + "confidence": 0.951 + }, + { + "text": "got", + "start": 86.12, + "end": 86.72, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 86.72, + "end": 87.12, + "confidence": 0.992 + }, + { + "text": "got", + "start": 87.24, + "end": 87.56, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 87.56, + "end": 87.94, + "confidence": 0.994 + }, + { + "text": "got", + "start": 88.08, + "end": 88.48, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 88.48, + "end": 88.5, + "confidence": 0.992 + }, + { + "text": "got", + "start": 88.5, + "end": 88.9, + "confidence": 0.94 + }, + { + "text": "them,", + "start": 88.9, + "end": 89.02, + "confidence": 0.99 + }, + { + "text": "got", + "start": 89.06, + "end": 89.08, + "confidence": 0.92 + }, + { + "text": "them,", + "start": 89.08, + "end": 89.1, + "confidence": 0.989 + }, + { + "text": "got", + "start": 89.1, + "end": 89.12, + "confidence": 0.908 + }, + { + "text": "them,", + "start": 89.12, + "end": 89.14, + "confidence": 0.987 + }, + { + "text": "got", + "start": 89.58, + "end": 89.6, + "confidence": 0.907 + 
}, + { + "text": "them,", + "start": 89.6, + "end": 89.62, + "confidence": 0.986 + }, + { + "text": "got", + "start": 90.06, + "end": 90.08, + "confidence": 0.915 + }, + { + "text": "them,", + "start": 90.08, + "end": 90.1, + "confidence": 0.982 + }, + { + "text": "got", + "start": 90.68, + "end": 90.7, + "confidence": 0.91 + }, + { + "text": "them,", + "start": 90.7, + "end": 90.72, + "confidence": 0.972 + }, + { + "text": "got", + "start": 91.88, + "end": 91.9, + "confidence": 0.856 + }, + { + "text": "them,", + "start": 91.9, + "end": 91.92, + "confidence": 0.965 + }, + { + "text": "got", + "start": 91.92, + "end": 91.94, + "confidence": 0.831 + }, + { + "text": "them,", + "start": 91.94, + "end": 91.96, + "confidence": 0.968 + }, + { + "text": "got", + "start": 91.96, + "end": 91.98, + "confidence": 0.855 + }, + { + "text": "them,", + "start": 91.98, + "end": 92.0, + "confidence": 0.97 + }, + { + "text": "got", + "start": 92.0, + "end": 92.02, + "confidence": 0.879 + }, + { + "text": "them,", + "start": 92.02, + "end": 92.04, + "confidence": 0.97 + }, + { + "text": "got", + "start": 92.04, + "end": 92.06, + "confidence": 0.889 + }, + { + "text": "them,", + "start": 92.06, + "end": 92.08, + "confidence": 0.97 + }, + { + "text": "got", + "start": 92.08, + "end": 92.1, + "confidence": 0.892 + }, + { + "text": "them,", + "start": 92.1, + "end": 92.12, + "confidence": 0.97 + }, + { + "text": "got", + "start": 92.12, + "end": 92.14, + "confidence": 0.884 + }, + { + "text": "them,", + "start": 92.14, + "end": 92.16, + "confidence": 0.972 + }, + { + "text": "got", + "start": 92.16, + "end": 92.18, + "confidence": 0.882 + }, + { + "text": "them,", + "start": 92.18, + "end": 92.2, + "confidence": 0.972 + }, + { + "text": "got", + "start": 92.2, + "end": 92.22, + "confidence": 0.88 + }, + { + "text": "them,", + "start": 92.22, + "end": 92.24, + "confidence": 0.97 + }, + { + "text": "got", + "start": 92.24, + "end": 92.26, + "confidence": 0.879 + }, + { + "text": "them,", 
+ "start": 92.26, + "end": 92.28, + "confidence": 0.97 + }, + { + "text": "got", + "start": 92.28, + "end": 92.3, + "confidence": 0.878 + }, + { + "text": "them,", + "start": 92.3, + "end": 92.32, + "confidence": 0.971 + }, + { + "text": "got", + "start": 92.32, + "end": 92.34, + "confidence": 0.874 + }, + { + "text": "them,", + "start": 92.34, + "end": 92.36, + "confidence": 0.971 + }, + { + "text": "got", + "start": 92.36, + "end": 92.38, + "confidence": 0.882 + }, + { + "text": "them,", + "start": 92.38, + "end": 92.4, + "confidence": 0.973 + }, + { + "text": "got", + "start": 92.4, + "end": 92.42, + "confidence": 0.881 + }, + { + "text": "them,", + "start": 92.42, + "end": 92.44, + "confidence": 0.973 + }, + { + "text": "got", + "start": 92.44, + "end": 92.46, + "confidence": 0.881 + }, + { + "text": "them,", + "start": 92.46, + "end": 92.48, + "confidence": 0.975 + }, + { + "text": "got", + "start": 92.48, + "end": 92.5, + "confidence": 0.885 + }, + { + "text": "them,", + "start": 92.5, + "end": 92.52, + "confidence": 0.976 + }, + { + "text": "got", + "start": 92.52, + "end": 92.54, + "confidence": 0.888 + }, + { + "text": "them,", + "start": 92.54, + "end": 92.56, + "confidence": 0.977 + }, + { + "text": "got", + "start": 92.56, + "end": 92.58, + "confidence": 0.888 + }, + { + "text": "them,", + "start": 92.58, + "end": 92.6, + "confidence": 0.978 + }, + { + "text": "got", + "start": 92.6, + "end": 92.62, + "confidence": 0.892 + }, + { + "text": "them,", + "start": 92.62, + "end": 92.64, + "confidence": 0.978 + }, + { + "text": "got", + "start": 92.64, + "end": 92.66, + "confidence": 0.896 + }, + { + "text": "them,", + "start": 92.66, + "end": 92.68, + "confidence": 0.979 + }, + { + "text": "got", + "start": 92.68, + "end": 92.7, + "confidence": 0.895 + }, + { + "text": "them,", + "start": 92.7, + "end": 92.72, + "confidence": 0.98 + }, + { + "text": "got", + "start": 92.72, + "end": 92.74, + "confidence": 0.897 + }, + { + "text": "them,", + "start": 92.74, + 
"end": 92.76, + "confidence": 0.981 + }, + { + "text": "got", + "start": 92.76, + "end": 92.78, + "confidence": 0.906 + }, + { + "text": "them,", + "start": 92.78, + "end": 92.8, + "confidence": 0.982 + }, + { + "text": "got", + "start": 92.8, + "end": 92.82, + "confidence": 0.906 + }, + { + "text": "them,", + "start": 92.82, + "end": 92.84, + "confidence": 0.983 + }, + { + "text": "got", + "start": 92.84, + "end": 92.86, + "confidence": 0.911 + }, + { + "text": "them,", + "start": 92.86, + "end": 92.88, + "confidence": 0.983 + }, + { + "text": "got", + "start": 92.88, + "end": 92.9, + "confidence": 0.917 + }, + { + "text": "them,", + "start": 92.9, + "end": 92.92, + "confidence": 0.984 + }, + { + "text": "got", + "start": 92.92, + "end": 92.94, + "confidence": 0.916 + }, + { + "text": "them,", + "start": 92.94, + "end": 92.96, + "confidence": 0.985 + }, + { + "text": "got", + "start": 92.96, + "end": 92.98, + "confidence": 0.924 + }, + { + "text": "them,", + "start": 92.98, + "end": 93.0, + "confidence": 0.986 + }, + { + "text": "got", + "start": 93.26, + "end": 93.28, + "confidence": 0.929 + }, + { + "text": "them,", + "start": 93.28, + "end": 93.3, + "confidence": 0.987 + }, + { + "text": "got", + "start": 93.3, + "end": 93.32, + "confidence": 0.931 + }, + { + "text": "them,", + "start": 93.32, + "end": 93.34, + "confidence": 0.987 + }, + { + "text": "got", + "start": 93.34, + "end": 93.36, + "confidence": 0.934 + }, + { + "text": "them,", + "start": 93.36, + "end": 93.38, + "confidence": 0.988 + }, + { + "text": "got", + "start": 93.38, + "end": 93.4, + "confidence": 0.94 + }, + { + "text": "them,", + "start": 93.4, + "end": 93.42, + "confidence": 0.989 + }, + { + "text": "got", + "start": 94.02, + "end": 96.72, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 96.72, + "end": 96.74, + "confidence": 0.99 + }, + { + "text": "got", + "start": 96.74, + "end": 96.76, + "confidence": 0.942 + }, + { + "text": "them,", + "start": 96.76, + "end": 96.78, + 
"confidence": 0.99 + }, + { + "text": "got", + "start": 96.78, + "end": 96.8, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 96.8, + "end": 96.82, + "confidence": 0.991 + }, + { + "text": "got", + "start": 96.82, + "end": 96.84, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 96.84, + "end": 96.86, + "confidence": 0.991 + }, + { + "text": "got", + "start": 96.86, + "end": 96.88, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 96.88, + "end": 96.9, + "confidence": 0.992 + }, + { + "text": "got", + "start": 96.9, + "end": 99.68, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 99.68, + "end": 99.7, + "confidence": 0.992 + }, + { + "text": "got", + "start": 99.78, + "end": 99.8, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 99.8, + "end": 100.0, + "confidence": 0.993 + }, + { + "text": "got", + "start": 100.66, + "end": 100.68, + "confidence": 0.962 + }, + { + "text": "them,", + "start": 100.68, + "end": 101.44, + "confidence": 0.993 + }, + { + "text": "got", + "start": 101.48, + "end": 101.5, + "confidence": 0.962 + }, + { + "text": "them,", + "start": 101.5, + "end": 101.52, + "confidence": 0.994 + }, + { + "text": "got", + "start": 101.52, + "end": 101.54, + "confidence": 0.966 + }, + { + "text": "them,", + "start": 101.54, + "end": 101.56, + "confidence": 0.994 + }, + { + "text": "got", + "start": 101.56, + "end": 101.58, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 101.58, + "end": 101.6, + "confidence": 0.994 + }, + { + "text": "got", + "start": 101.6, + "end": 101.62, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 101.62, + "end": 101.64, + "confidence": 0.994 + }, + { + "text": "got", + "start": 101.64, + "end": 101.66, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 101.66, + "end": 101.68, + "confidence": 0.995 + }, + { + "text": "got", + "start": 101.68, + "end": 101.7, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 101.7, + "end": 
101.72, + "confidence": 0.995 + }, + { + "text": "got", + "start": 101.72, + "end": 101.74, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 101.74, + "end": 101.88, + "confidence": 0.995 + }, + { + "text": "got", + "start": 101.88, + "end": 101.9, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 101.9, + "end": 101.92, + "confidence": 0.995 + }, + { + "text": "got", + "start": 101.92, + "end": 101.94, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 101.94, + "end": 101.96, + "confidence": 0.996 + }, + { + "text": "got", + "start": 101.96, + "end": 101.98, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 101.98, + "end": 102.0, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.0, + "end": 102.02, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 102.02, + "end": 102.04, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.04, + "end": 102.06, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 102.06, + "end": 102.08, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.08, + "end": 102.1, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 102.1, + "end": 102.12, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.12, + "end": 102.14, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 102.14, + "end": 102.18, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.18, + "end": 102.2, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 102.2, + "end": 102.22, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.22, + "end": 102.24, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 102.24, + "end": 102.26, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.26, + "end": 102.28, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 102.28, + "end": 102.3, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.3, + "end": 102.32, + "confidence": 0.981 + }, + { + "text": "them,", 
+ "start": 102.32, + "end": 102.34, + "confidence": 0.996 + }, + { + "text": "got", + "start": 102.34, + "end": 102.36, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 102.36, + "end": 103.8, + "confidence": 0.997 + }, + { + "text": "got", + "start": 103.8, + "end": 103.82, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 103.82, + "end": 105.08, + "confidence": 0.997 + }, + { + "text": "got", + "start": 105.08, + "end": 105.1, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 105.1, + "end": 110.38, + "confidence": 0.997 + }, + { + "text": "got", + "start": 110.38, + "end": 110.4, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 110.4, + "end": 111.78, + "confidence": 0.997 + }, + { + "text": "got", + "start": 111.78, + "end": 111.8, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 111.8, + "end": 114.74, + "confidence": 0.997 + }, + { + "text": "got", + "start": 114.74, + "end": 114.98, + "confidence": 0.985 + }, + { + "text": "them", + "start": 114.98, + "end": 115.0, + "confidence": 0.997 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/medium_auto.cpu/empty.mp3.words.json b/tests/expected/medium_auto.cpu/empty.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..4343ff36131a9ff2cd0f90ee1eb0dcace7c2c1e4 --- /dev/null +++ b/tests/expected/medium_auto.cpu/empty.mp3.words.json @@ -0,0 +1,46 @@ +{ + "text": " Thanks for watching!", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.02, + "end": 3.06, + "text": " Thanks for watching!", + "tokens": [ + 50364, + 2561, + 337, + 1976, + 0, + 50514 + ], + "temperature": 0.0, + "avg_logprob": -0.8994035720825195, + "compression_ratio": 0.7142857142857143, + "no_speech_prob": 0.6661779880523682, + "confidence": 0.373, + "words": [ + { + "text": "Thanks", + "start": 0.02, + "end": 0.44, + "confidence": 0.06 + }, + { + "text": "for", + "start": 0.44, + "end": 1.02, + "confidence": 
0.916 + }, + { + "text": "watching!", + "start": 1.02, + "end": 3.06, + "confidence": 0.936 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/medium_auto.cpu/radio_short.mp3.words.json b/tests/expected/medium_auto.cpu/radio_short.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..b5ad9acab69d8c24acd10bd904b99b423c6c97ec --- /dev/null +++ b/tests/expected/medium_auto.cpu/radio_short.mp3.words.json @@ -0,0 +1,1616 @@ +{ + "text": "3212122222222211111111111111111111111111111111111111111111111111111111", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.04, + "end": 0.64, + "text": "3", + "tokens": [ + 18 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.029, + "words": [ + { + "text": "3", + "start": 0.04, + "end": 0.64, + "confidence": 0.029 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.52, + "end": 3.0, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.688, + "words": [ + { + "text": "2", + "start": 1.52, + "end": 3.0, + "confidence": 0.688 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 3.68, + "end": 5.32, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.95, + "words": [ + { + "text": "1", + "start": 3.68, + "end": 5.32, + "confidence": 0.95 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 6.5, + "end": 7.02, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.278, + "words": [ + { + "text": "2", + "start": 6.5, + "end": 7.02, + "confidence": 0.278 + } + ] + }, + { + 
"id": 4, + "seek": 0, + "start": 8.08, + "end": 9.68, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.702, + "words": [ + { + "text": "1", + "start": 8.08, + "end": 9.68, + "confidence": 0.702 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 10.38, + "end": 11.04, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.919, + "words": [ + { + "text": "2", + "start": 10.38, + "end": 11.04, + "confidence": 0.919 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 11.54, + "end": 13.04, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.657, + "words": [ + { + "text": "2", + "start": 11.54, + "end": 13.04, + "confidence": 0.657 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 13.52, + "end": 15.57, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.772, + "words": [ + { + "text": "2", + "start": 13.52, + "end": 15.57, + "confidence": 0.772 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 15.57, + "end": 16.98, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.905, + "words": [ + { + "text": "2", + "start": 15.57, + "end": 16.98, + "confidence": 0.905 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 17.52, + "end": 19.22, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + 
"confidence": 0.808, + "words": [ + { + "text": "2", + "start": 17.52, + "end": 19.22, + "confidence": 0.808 + } + ] + }, + { + "id": 10, + "seek": 0, + "start": 19.62, + "end": 20.68, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.626, + "words": [ + { + "text": "2", + "start": 19.62, + "end": 20.68, + "confidence": 0.626 + } + ] + }, + { + "id": 11, + "seek": 0, + "start": 22.22, + "end": 22.86, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.835, + "words": [ + { + "text": "2", + "start": 22.22, + "end": 22.86, + "confidence": 0.835 + } + ] + }, + { + "id": 12, + "seek": 0, + "start": 23.52, + "end": 24.68, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.974, + "words": [ + { + "text": "2", + "start": 23.52, + "end": 24.68, + "confidence": 0.974 + } + ] + }, + { + "id": 13, + "seek": 0, + "start": 25.7, + "end": 27.1, + "text": "2", + "tokens": [ + 17 + ], + "temperature": 0.0, + "avg_logprob": -0.28690400990572845, + "compression_ratio": 1.0, + "no_speech_prob": 0.8406417965888977, + "confidence": 0.97, + "words": [ + { + "text": "2", + "start": 25.7, + "end": 27.1, + "confidence": 0.97 + } + ] + }, + { + "id": 14, + "seek": 2800, + "start": 28.02, + "end": 28.86, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.271, + "words": [ + { + "text": "1", + "start": 28.02, + "end": 28.86, + "confidence": 0.271 + } + ] + }, + { + "id": 15, + "seek": 2800, + "start": 30.5, + "end": 31.12, + "text": "1", + 
"tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.504, + "words": [ + { + "text": "1", + "start": 30.5, + "end": 31.12, + "confidence": 0.504 + } + ] + }, + { + "id": 16, + "seek": 2800, + "start": 31.52, + "end": 33.55, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.911, + "words": [ + { + "text": "1", + "start": 31.52, + "end": 33.55, + "confidence": 0.911 + } + ] + }, + { + "id": 17, + "seek": 2800, + "start": 33.55, + "end": 35.02, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.894, + "words": [ + { + "text": "1", + "start": 33.55, + "end": 35.02, + "confidence": 0.894 + } + ] + }, + { + "id": 18, + "seek": 2800, + "start": 36.24, + "end": 37.52, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.957, + "words": [ + { + "text": "1", + "start": 36.24, + "end": 37.52, + "confidence": 0.957 + } + ] + }, + { + "id": 19, + "seek": 2800, + "start": 37.68, + "end": 39.8, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.958, + "words": [ + { + "text": "1", + "start": 37.68, + "end": 39.8, + "confidence": 0.958 + } + ] + }, + { + "id": 20, + "seek": 2800, + "start": 39.8, + "end": 41.2, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + 
"no_speech_prob": 0.022917350754141808, + "confidence": 0.967, + "words": [ + { + "text": "1", + "start": 39.8, + "end": 41.2, + "confidence": 0.967 + } + ] + }, + { + "id": 21, + "seek": 2800, + "start": 41.52, + "end": 44.02, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.973, + "words": [ + { + "text": "1", + "start": 41.52, + "end": 44.02, + "confidence": 0.973 + } + ] + }, + { + "id": 22, + "seek": 2800, + "start": 44.02, + "end": 45.04, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.944, + "words": [ + { + "text": "1", + "start": 44.02, + "end": 45.04, + "confidence": 0.944 + } + ] + }, + { + "id": 23, + "seek": 2800, + "start": 45.52, + "end": 47.53, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.959, + "words": [ + { + "text": "1", + "start": 45.52, + "end": 47.53, + "confidence": 0.959 + } + ] + }, + { + "id": 24, + "seek": 2800, + "start": 47.53, + "end": 48.94, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.966, + "words": [ + { + "text": "1", + "start": 47.53, + "end": 48.94, + "confidence": 0.966 + } + ] + }, + { + "id": 25, + "seek": 2800, + "start": 50.2, + "end": 52.06, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.968, + "words": [ + { + "text": "1", + "start": 50.2, + "end": 52.06, 
+ "confidence": 0.968 + } + ] + }, + { + "id": 26, + "seek": 2800, + "start": 52.32, + "end": 52.84, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.964, + "words": [ + { + "text": "1", + "start": 52.32, + "end": 52.84, + "confidence": 0.964 + } + ] + }, + { + "id": 27, + "seek": 2800, + "start": 53.64, + "end": 54.9, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12449877912347967, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.022917350754141808, + "confidence": 0.944, + "words": [ + { + "text": "1", + "start": 53.64, + "end": 54.9, + "confidence": 0.944 + } + ] + }, + { + "id": 28, + "seek": 5600, + "start": 56.02, + "end": 57.06, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.377, + "words": [ + { + "text": "1", + "start": 56.02, + "end": 57.06, + "confidence": 0.377 + } + ] + }, + { + "id": 29, + "seek": 5600, + "start": 57.52, + "end": 58.8, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.763, + "words": [ + { + "text": "1", + "start": 57.52, + "end": 58.8, + "confidence": 0.763 + } + ] + }, + { + "id": 30, + "seek": 5600, + "start": 59.8, + "end": 61.08, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.952, + "words": [ + { + "text": "1", + "start": 59.8, + "end": 61.08, + "confidence": 0.952 + } + ] + }, + { + "id": 31, + "seek": 5600, + "start": 61.52, + "end": 63.08, + "text": "1", + "tokens": [ 
+ 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.949, + "words": [ + { + "text": "1", + "start": 61.52, + "end": 63.08, + "confidence": 0.949 + } + ] + }, + { + "id": 32, + "seek": 5600, + "start": 64.04, + "end": 65.18, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.954, + "words": [ + { + "text": "1", + "start": 64.04, + "end": 65.18, + "confidence": 0.954 + } + ] + }, + { + "id": 33, + "seek": 5600, + "start": 65.52, + "end": 66.7, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.952, + "words": [ + { + "text": "1", + "start": 65.52, + "end": 66.7, + "confidence": 0.952 + } + ] + }, + { + "id": 34, + "seek": 5600, + "start": 67.52, + "end": 69.08, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.966, + "words": [ + { + "text": "1", + "start": 67.52, + "end": 69.08, + "confidence": 0.966 + } + ] + }, + { + "id": 35, + "seek": 5600, + "start": 69.58, + "end": 71.65, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.958, + "words": [ + { + "text": "1", + "start": 69.58, + "end": 71.65, + "confidence": 0.958 + } + ] + }, + { + "id": 36, + "seek": 5600, + "start": 71.65, + "end": 73.62, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + 
"no_speech_prob": 0.015843844041228294, + "confidence": 0.957, + "words": [ + { + "text": "1", + "start": 71.65, + "end": 73.62, + "confidence": 0.957 + } + ] + }, + { + "id": 37, + "seek": 5600, + "start": 73.62, + "end": 75.85, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.953, + "words": [ + { + "text": "1", + "start": 73.62, + "end": 75.85, + "confidence": 0.953 + } + ] + }, + { + "id": 38, + "seek": 5600, + "start": 75.85, + "end": 77.12, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.942, + "words": [ + { + "text": "1", + "start": 75.85, + "end": 77.12, + "confidence": 0.942 + } + ] + }, + { + "id": 39, + "seek": 5600, + "start": 78.22, + "end": 78.78, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.936, + "words": [ + { + "text": "1", + "start": 78.22, + "end": 78.78, + "confidence": 0.936 + } + ] + }, + { + "id": 40, + "seek": 5600, + "start": 80.08, + "end": 80.86, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.929, + "words": [ + { + "text": "1", + "start": 80.08, + "end": 80.86, + "confidence": 0.929 + } + ] + }, + { + "id": 41, + "seek": 5600, + "start": 81.52, + "end": 82.7, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.12232361056587913, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.015843844041228294, + "confidence": 0.903, + "words": [ + { + "text": "1", + "start": 81.52, + "end": 
82.7, + "confidence": 0.903 + } + ] + }, + { + "id": 42, + "seek": 8400, + "start": 84.88, + "end": 85.08, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.82, + "words": [ + { + "text": "1", + "start": 84.88, + "end": 85.08, + "confidence": 0.82 + } + ] + }, + { + "id": 43, + "seek": 8400, + "start": 85.58, + "end": 86.86, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.884, + "words": [ + { + "text": "1", + "start": 85.58, + "end": 86.86, + "confidence": 0.884 + } + ] + }, + { + "id": 44, + "seek": 8400, + "start": 88.02, + "end": 89.2, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.957, + "words": [ + { + "text": "1", + "start": 88.02, + "end": 89.2, + "confidence": 0.957 + } + ] + }, + { + "id": 45, + "seek": 8400, + "start": 89.52, + "end": 90.98, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.952, + "words": [ + { + "text": "1", + "start": 89.52, + "end": 90.98, + "confidence": 0.952 + } + ] + }, + { + "id": 46, + "seek": 8400, + "start": 92.5, + "end": 93.04, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.917, + "words": [ + { + "text": "1", + "start": 92.5, + "end": 93.04, + "confidence": 0.917 + } + ] + }, + { + "id": 47, + "seek": 8400, + "start": 93.58, + "end": 95.56, + "text": "1", + "tokens": [ 
+ 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.947, + "words": [ + { + "text": "1", + "start": 93.58, + "end": 95.56, + "confidence": 0.947 + } + ] + }, + { + "id": 48, + "seek": 8400, + "start": 95.6, + "end": 97.95, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.97, + "words": [ + { + "text": "1", + "start": 95.6, + "end": 97.95, + "confidence": 0.97 + } + ] + }, + { + "id": 49, + "seek": 8400, + "start": 97.95, + "end": 99.14, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.976, + "words": [ + { + "text": "1", + "start": 97.95, + "end": 99.14, + "confidence": 0.976 + } + ] + }, + { + "id": 50, + "seek": 8400, + "start": 99.52, + "end": 101.08, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.984, + "words": [ + { + "text": "1", + "start": 99.52, + "end": 101.08, + "confidence": 0.984 + } + ] + }, + { + "id": 51, + "seek": 8400, + "start": 101.52, + "end": 103.62, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.985, + "words": [ + { + "text": "1", + "start": 101.52, + "end": 103.62, + "confidence": 0.985 + } + ] + }, + { + "id": 52, + "seek": 8400, + "start": 103.62, + "end": 105.7, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + 
"no_speech_prob": 0.02908501960337162, + "confidence": 0.988, + "words": [ + { + "text": "1", + "start": 103.62, + "end": 105.7, + "confidence": 0.988 + } + ] + }, + { + "id": 53, + "seek": 8400, + "start": 106.5, + "end": 107.12, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.957, + "words": [ + { + "text": "1", + "start": 106.5, + "end": 107.12, + "confidence": 0.957 + } + ] + }, + { + "id": 54, + "seek": 8400, + "start": 108.5, + "end": 109.22, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.946, + "words": [ + { + "text": "1", + "start": 108.5, + "end": 109.22, + "confidence": 0.946 + } + ] + }, + { + "id": 55, + "seek": 8400, + "start": 109.52, + "end": 111.36, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10775410045276988, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.02908501960337162, + "confidence": 0.89, + "words": [ + { + "text": "1", + "start": 109.52, + "end": 111.36, + "confidence": 0.89 + } + ] + }, + { + "id": 56, + "seek": 11200, + "start": 112.98, + "end": 113.34, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.895, + "words": [ + { + "text": "1", + "start": 112.98, + "end": 113.34, + "confidence": 0.895 + } + ] + }, + { + "id": 57, + "seek": 11200, + "start": 113.88, + "end": 114.52, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.871, + "words": [ + { + "text": "1", + "start": 113.88, + 
"end": 114.52, + "confidence": 0.871 + } + ] + }, + { + "id": 58, + "seek": 11200, + "start": 115.94, + "end": 117.2, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.977, + "words": [ + { + "text": "1", + "start": 115.94, + "end": 117.2, + "confidence": 0.977 + } + ] + }, + { + "id": 59, + "seek": 11200, + "start": 117.52, + "end": 118.64, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.975, + "words": [ + { + "text": "1", + "start": 117.52, + "end": 118.64, + "confidence": 0.975 + } + ] + }, + { + "id": 60, + "seek": 11200, + "start": 120.5, + "end": 120.8, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.957, + "words": [ + { + "text": "1", + "start": 120.5, + "end": 120.8, + "confidence": 0.957 + } + ] + }, + { + "id": 61, + "seek": 11200, + "start": 121.58, + "end": 123.74, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.959, + "words": [ + { + "text": "1", + "start": 121.58, + "end": 123.74, + "confidence": 0.959 + } + ] + }, + { + "id": 62, + "seek": 11200, + "start": 123.9, + "end": 125.56, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.967, + "words": [ + { + "text": "1", + "start": 123.9, + "end": 125.56, + "confidence": 0.967 + } + ] + }, + { + "id": 63, + "seek": 11200, + "start": 125.56, + "end": 
127.34, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.968, + "words": [ + { + "text": "1", + "start": 125.56, + "end": 127.34, + "confidence": 0.968 + } + ] + }, + { + "id": 64, + "seek": 11200, + "start": 127.52, + "end": 129.2, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.96, + "words": [ + { + "text": "1", + "start": 127.52, + "end": 129.2, + "confidence": 0.96 + } + ] + }, + { + "id": 65, + "seek": 11200, + "start": 129.52, + "end": 131.06, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.965, + "words": [ + { + "text": "1", + "start": 129.52, + "end": 131.06, + "confidence": 0.965 + } + ] + }, + { + "id": 66, + "seek": 11200, + "start": 131.52, + "end": 133.3, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.969, + "words": [ + { + "text": "1", + "start": 131.52, + "end": 133.3, + "confidence": 0.969 + } + ] + }, + { + "id": 67, + "seek": 11200, + "start": 133.52, + "end": 135.73, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.966, + "words": [ + { + "text": "1", + "start": 133.52, + "end": 135.73, + "confidence": 0.966 + } + ] + }, + { + "id": 68, + "seek": 11200, + "start": 135.73, + "end": 137.34, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + 
"compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.971, + "words": [ + { + "text": "1", + "start": 135.73, + "end": 137.34, + "confidence": 0.971 + } + ] + }, + { + "id": 69, + "seek": 11200, + "start": 137.52, + "end": 139.8, + "text": "1", + "tokens": [ + 16 + ], + "temperature": 0.0, + "avg_logprob": -0.10804855823516846, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.04961525276303291, + "confidence": 0.925, + "words": [ + { + "text": "1", + "start": 137.52, + "end": 139.8, + "confidence": 0.925 + } + ] + } + ], + "language": "zh" +} \ No newline at end of file diff --git a/tests/expected/medium_auto.cpu/smartphone.mp3.words.json b/tests/expected/medium_auto.cpu/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..9faa961d5cf4a38b6ac04b76010aeaddb28cee89 --- /dev/null +++ b/tests/expected/medium_auto.cpu/smartphone.mp3.words.json @@ -0,0 +1,4802 @@ +{ + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions, mais la manière dont elles interagissent entre elles. Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces. L'écran tactile a été beaucoup très souvent mentionné. Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes. Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible. Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but. Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité. Mais ça, ça soulève une autre interrogation. 
Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit? Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone? Il n'y a pas d'équivalent en fait. Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant. Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendants de cet objet, d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet. Donc, à objet inédit, rapport inédit. Et ce rapport, si j'en crois Nicolas, serait caractérisé par un mélange de dépendance et de rejet. Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment. Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre. On peut adorer sa bagnole, en avoir besoin pour plein de choses. Et bien, le soir, quand on va se coucher, on la laisse. On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes. On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui, continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe, comme si le lâcher allait entraîner sa mort immédiate. Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi. Donc, rapport inédit. D'accord. Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais? 
Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux? Les économistes parlent de dépendance du sentier. C'est l'idée qu'on est sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.38, + "end": 3.62, + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça.", + "tokens": [ + 383, + 6, + 377, + 20090, + 1078, + 1769, + 631, + 6176, + 38268, + 11, + 2420, + 1506, + 408, + 385, + 287, + 6, + 22824, + 14540, + 49990, + 526, + 5173, + 2788, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.935, + "words": [ + { + "text": "C'est", + "start": 0.38, + "end": 0.58, + "confidence": 0.961 + }, + { + "text": "évident", + "start": 0.58, + "end": 0.88, + "confidence": 0.984 + }, + { + "text": "ce", + "start": 0.88, + "end": 1.02, + "confidence": 0.663 + }, + { + "text": "que", + "start": 1.02, + "end": 1.08, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 1.08, + "end": 1.2, + "confidence": 0.994 + }, + { + "text": "Nicolas,", + "start": 1.2, + "end": 1.78, + "confidence": 0.91 + }, + { + "text": "mais", + "start": 1.78, + "end": 1.9, + "confidence": 0.979 + }, + { + "text": "je", + "start": 1.9, + "end": 2.24, + "confidence": 0.982 + }, + { + "text": "ne", + "start": 2.24, + "end": 2.34, + "confidence": 0.835 + }, + { + "text": "me", + "start": 2.34, + "end": 2.38, + "confidence": 0.82 + }, + { + "text": "l'étais", + "start": 2.38, + "end": 2.58, + "confidence": 0.971 + }, + { + "text": "jamais", + "start": 2.58, + "end": 2.84, + "confidence": 0.989 + }, + { + "text": "formulé", + "start": 2.84, + "end": 3.26, + "confidence": 0.909 + }, + { + "text": "comme", + "start": 3.26, + "end": 
3.42, + "confidence": 0.993 + }, + { + "text": "ça.", + "start": 3.42, + "end": 3.62, + "confidence": 0.975 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 4.08, + "end": 7.92, + "text": " Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions,", + "tokens": [ + 8257, + 1956, + 3887, + 635, + 3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 287, + 6, + 8476, + 449, + 2776, + 730, + 17290, + 3916, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.93, + "words": [ + { + "text": "Ce", + "start": 4.08, + "end": 4.26, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 4.26, + "end": 4.34, + "confidence": 0.958 + }, + { + "text": "fait", + "start": 4.34, + "end": 4.48, + "confidence": 0.565 + }, + { + "text": "la", + "start": 4.48, + "end": 4.66, + "confidence": 0.971 + }, + { + "text": "force", + "start": 4.66, + "end": 5.0, + "confidence": 0.999 + }, + { + "text": "du", + "start": 5.0, + "end": 5.2, + "confidence": 0.996 + }, + { + "text": "smartphone,", + "start": 5.2, + "end": 5.88, + "confidence": 0.911 + }, + { + "text": "c'est", + "start": 5.88, + "end": 6.12, + "confidence": 0.88 + }, + { + "text": "pas", + "start": 6.12, + "end": 6.26, + "confidence": 0.992 + }, + { + "text": "seulement", + "start": 6.26, + "end": 6.52, + "confidence": 0.999 + }, + { + "text": "l'accumulation", + "start": 6.52, + "end": 7.38, + "confidence": 0.958 + }, + { + "text": "des", + "start": 7.38, + "end": 7.56, + "confidence": 0.983 + }, + { + "text": "fonctions,", + "start": 7.56, + "end": 7.92, + "confidence": 0.987 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 8.32, + "end": 10.88, + "text": " mais la manière dont elles interagissent entre elles.", + "tokens": [ + 2420, + 635, + 22267, + 9400, + 23576, + 728, + 559, + 25450, + 3962, + 23576, + 13 + ], + "temperature": 0.0, + "avg_logprob": 
-0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.977, + "words": [ + { + "text": "mais", + "start": 8.32, + "end": 8.44, + "confidence": 0.992 + }, + { + "text": "la", + "start": 8.44, + "end": 8.6, + "confidence": 0.995 + }, + { + "text": "manière", + "start": 8.6, + "end": 8.9, + "confidence": 0.999 + }, + { + "text": "dont", + "start": 8.9, + "end": 9.1, + "confidence": 0.978 + }, + { + "text": "elles", + "start": 9.1, + "end": 9.48, + "confidence": 0.967 + }, + { + "text": "interagissent", + "start": 9.48, + "end": 10.32, + "confidence": 0.964 + }, + { + "text": "entre", + "start": 10.32, + "end": 10.58, + "confidence": 0.956 + }, + { + "text": "elles.", + "start": 10.58, + "end": 10.88, + "confidence": 0.99 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 10.96, + "end": 13.0, + "text": " Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant.", + "tokens": [ + 8257, + 1956, + 6176, + 274, + 6, + 19400, + 1022, + 635, + 5052, + 11, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.906, + "words": [ + { + "text": "Ce", + "start": 10.96, + "end": 11.16, + "confidence": 0.607 + }, + { + "text": "qui", + "start": 11.16, + "end": 11.22, + "confidence": 0.765 + }, + { + "text": "dit", + "start": 11.22, + "end": 11.4, + "confidence": 0.983 + }, + { + "text": "d'ailleurs", + "start": 11.4, + "end": 11.56, + "confidence": 0.985 + }, + { + "text": "sur", + "start": 11.56, + "end": 11.72, + "confidence": 0.477 + }, + { + "text": "la", + "start": 11.72, + "end": 11.78, + "confidence": 0.984 + }, + { + "text": "photo,", + "start": 11.78, + "end": 12.12, + "confidence": 0.994 + }, + { + "text": "c'est", + "start": 12.12, + "end": 12.2, + "confidence": 0.997 + }, + { + "text": "hyper", + "start": 12.2, + "end": 12.42, + 
"confidence": 0.993 + }, + { + "text": "convaincant.", + "start": 12.42, + "end": 13.0, + "confidence": 0.982 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.34, + "end": 16.02, + "text": " Alors évidemment, il faudrait ajouter les interfaces.", + "tokens": [ + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.913, + "words": [ + { + "text": "Alors", + "start": 13.34, + "end": 13.62, + "confidence": 0.585 + }, + { + "text": "évidemment,", + "start": 13.62, + "end": 14.34, + "confidence": 0.832 + }, + { + "text": "il", + "start": 14.34, + "end": 14.38, + "confidence": 0.952 + }, + { + "text": "faudrait", + "start": 14.38, + "end": 14.74, + "confidence": 0.996 + }, + { + "text": "ajouter", + "start": 14.74, + "end": 15.16, + "confidence": 0.992 + }, + { + "text": "les", + "start": 15.16, + "end": 15.52, + "confidence": 0.985 + }, + { + "text": "interfaces.", + "start": 15.52, + "end": 16.02, + "confidence": 0.984 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 16.22, + "end": 19.36, + "text": " L'écran tactile a été beaucoup très souvent mentionné.", + "tokens": [ + 441, + 6, + 9062, + 4257, + 47319, + 257, + 8862, + 8796, + 5732, + 20847, + 2152, + 15055, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.923, + "words": [ + { + "text": "L'écran", + "start": 16.22, + "end": 16.7, + "confidence": 0.996 + }, + { + "text": "tactile", + "start": 16.7, + "end": 17.06, + "confidence": 0.986 + }, + { + "text": "a", + "start": 17.06, + "end": 17.26, + "confidence": 0.98 + }, + { + "text": "été", + "start": 17.26, + "end": 17.88, + "confidence": 0.975 + }, + { + "text": "beaucoup", + "start": 17.88, + "end": 18.28, + "confidence": 0.976 + }, + { 
+ "text": "très", + "start": 18.28, + "end": 18.62, + "confidence": 0.447 + }, + { + "text": "souvent", + "start": 18.62, + "end": 18.9, + "confidence": 0.996 + }, + { + "text": "mentionné.", + "start": 18.9, + "end": 19.36, + "confidence": 0.978 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 19.84, + "end": 25.26, + "text": " Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes.", + "tokens": [ + 6313, + 4428, + 11, + 1930, + 8487, + 1264, + 421, + 6, + 388, + 1740, + 642, + 6212, + 368, + 945, + 1567, + 17338, + 1512, + 358, + 1625, + 1512, + 4792, + 13923, + 2156, + 4666, + 6592, + 724, + 5714, + 1531, + 596, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.92, + "words": [ + { + "text": "Mais", + "start": 19.84, + "end": 20.22, + "confidence": 0.944 + }, + { + "text": "bon,", + "start": 20.22, + "end": 20.52, + "confidence": 0.667 + }, + { + "text": "il", + "start": 20.52, + "end": 20.6, + "confidence": 0.99 + }, + { + "text": "faut", + "start": 20.6, + "end": 20.7, + "confidence": 0.99 + }, + { + "text": "dire", + "start": 20.7, + "end": 20.84, + "confidence": 0.995 + }, + { + "text": "qu'il", + "start": 20.84, + "end": 20.96, + "confidence": 0.88 + }, + { + "text": "profite", + "start": 20.96, + "end": 21.26, + "confidence": 0.995 + }, + { + "text": "aussi", + "start": 21.26, + "end": 21.68, + "confidence": 0.972 + }, + { + "text": "de", + "start": 21.68, + "end": 21.9, + "confidence": 0.97 + }, + { + "text": "20", + "start": 21.9, + "end": 22.1, + "confidence": 0.812 + }, + { + "text": "ans", + "start": 22.1, + "end": 22.32, + "confidence": 0.997 + }, + { + "text": "pendant", + "start": 22.32, + "end": 22.48, + "confidence": 0.72 + }, + { + "text": "lesquels", + "start": 22.48, + "end": 22.92, + "confidence": 
0.98 + }, + { + "text": "les", + "start": 22.92, + "end": 23.04, + "confidence": 0.709 + }, + { + "text": "ordinateurs", + "start": 23.04, + "end": 23.54, + "confidence": 0.965 + }, + { + "text": "nous", + "start": 23.54, + "end": 23.72, + "confidence": 0.602 + }, + { + "text": "ont", + "start": 23.72, + "end": 23.82, + "confidence": 0.974 + }, + { + "text": "appris", + "start": 23.82, + "end": 24.1, + "confidence": 0.991 + }, + { + "text": "à", + "start": 24.1, + "end": 24.24, + "confidence": 0.829 + }, + { + "text": "cliquer", + "start": 24.24, + "end": 24.5, + "confidence": 0.989 + }, + { + "text": "sur", + "start": 24.5, + "end": 24.66, + "confidence": 0.984 + }, + { + "text": "des", + "start": 24.66, + "end": 24.94, + "confidence": 0.971 + }, + { + "text": "icônes.", + "start": 24.94, + "end": 25.26, + "confidence": 0.992 + } + ] + }, + { + "id": 7, + "seek": 2534, + "start": 25.42, + "end": 30.64, + "text": " Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible.", + "tokens": [ + 318, + 9507, + 631, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 1769, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.969, + "words": [ + { + "text": "Sauf", + "start": 25.42, + "end": 25.76, + "confidence": 0.99 + }, + { + "text": "que", + "start": 25.76, + "end": 26.26, + "confidence": 0.996 + }, + { + "text": "le", + "start": 26.26, + "end": 26.66, + "confidence": 0.631 + }, + { + "text": "smartphone", + "start": 26.66, + "end": 27.06, + "confidence": 0.996 + }, + { + "text": "ajoute", + "start": 27.06, + "end": 27.44, + "confidence": 0.991 + }, + { + "text": "le", + "start": 27.44, + "end": 27.62, + "confidence": 0.992 + }, + { + "text": "toucher,", + "start": 27.62, + "end": 28.18, + "confidence": 0.988 + }, + { + "text": "ce", 
+ "start": 28.18, + "end": 28.22, + "confidence": 0.99 + }, + { + "text": "qui", + "start": 28.22, + "end": 28.28, + "confidence": 1.0 + }, + { + "text": "rend", + "start": 28.28, + "end": 28.48, + "confidence": 0.994 + }, + { + "text": "le", + "start": 28.48, + "end": 28.68, + "confidence": 0.993 + }, + { + "text": "contact", + "start": 28.68, + "end": 29.1, + "confidence": 0.999 + }, + { + "text": "plus", + "start": 29.1, + "end": 29.46, + "confidence": 0.985 + }, + { + "text": "direct,", + "start": 29.46, + "end": 30.22, + "confidence": 0.995 + }, + { + "text": "plus", + "start": 30.22, + "end": 30.26, + "confidence": 0.994 + }, + { + "text": "sensible.", + "start": 30.26, + "end": 30.64, + "confidence": 0.997 + } + ] + }, + { + "id": 8, + "seek": 2534, + "start": 31.04, + "end": 37.82, + "text": " Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but.", + "tokens": [ + 3790, + 9093, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193, + 476, + 18437, + 10095, + 602, + 84, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 1609, + 457, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.892, + "words": [ + { + "text": "Et", + "start": 31.04, + "end": 31.22, + "confidence": 0.97 + }, + { + "text": "puis", + "start": 31.22, + "end": 31.36, + "confidence": 0.971 + }, + { + "text": "évidemment,", + "start": 31.36, + "end": 31.7, + "confidence": 0.875 + }, + { + "text": "il", + "start": 31.7, + "end": 31.74, + "confidence": 0.993 + }, + { + "text": "faudrait", + "start": 31.74, + "end": 31.94, + "confidence": 0.995 + }, + { + "text": "parler", + "start": 31.94, + "end": 32.12, + "confidence": 0.84 + }, + { + "text": "aussi", + "start": 32.12, + "end": 32.34, + 
"confidence": 0.977 + }, + { + "text": "des", + "start": 32.34, + "end": 32.48, + "confidence": 0.994 + }, + { + "text": "applications", + "start": 32.48, + "end": 32.9, + "confidence": 0.993 + }, + { + "text": "qui", + "start": 32.9, + "end": 33.18, + "confidence": 0.481 + }, + { + "text": "permettent", + "start": 33.18, + "end": 33.74, + "confidence": 0.992 + }, + { + "text": "de", + "start": 33.74, + "end": 33.96, + "confidence": 0.885 + }, + { + "text": "contourner", + "start": 33.96, + "end": 34.42, + "confidence": 0.958 + }, + { + "text": "le", + "start": 34.42, + "end": 34.52, + "confidence": 0.775 + }, + { + "text": "côté", + "start": 34.52, + "end": 34.8, + "confidence": 0.984 + }, + { + "text": "touffu", + "start": 34.8, + "end": 35.32, + "confidence": 0.741 + }, + { + "text": "de", + "start": 35.32, + "end": 35.72, + "confidence": 0.882 + }, + { + "text": "la", + "start": 35.72, + "end": 35.78, + "confidence": 0.992 + }, + { + "text": "navigation", + "start": 35.78, + "end": 36.24, + "confidence": 0.994 + }, + { + "text": "web", + "start": 36.24, + "end": 36.6, + "confidence": 0.854 + }, + { + "text": "pour", + "start": 36.6, + "end": 36.78, + "confidence": 0.585 + }, + { + "text": "aller", + "start": 36.78, + "end": 36.98, + "confidence": 0.987 + }, + { + "text": "directement", + "start": 36.98, + "end": 37.52, + "confidence": 0.997 + }, + { + "text": "au", + "start": 37.52, + "end": 37.68, + "confidence": 0.967 + }, + { + "text": "but.", + "start": 37.68, + "end": 37.82, + "confidence": 0.995 + } + ] + }, + { + "id": 9, + "seek": 2534, + "start": 37.82, + "end": 46.54, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 8603, + 14964, + 9400, + 38268, + 6176, + 421, + 6, + 388, + 871, + 6070, + 271, + 443, + 5199, 
+ 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.974, + "words": [ + { + "text": "Bref,", + "start": 37.82, + "end": 38.76, + "confidence": 0.987 + }, + { + "text": "tout", + "start": 38.76, + "end": 38.98, + "confidence": 0.711 + }, + { + "text": "ça,", + "start": 38.98, + "end": 39.42, + "confidence": 0.995 + }, + { + "text": "ce", + "start": 39.42, + "end": 39.7, + "confidence": 0.993 + }, + { + "text": "sont", + "start": 39.7, + "end": 39.88, + "confidence": 0.999 + }, + { + "text": "les", + "start": 39.88, + "end": 40.16, + "confidence": 0.991 + }, + { + "text": "conditions", + "start": 40.16, + "end": 40.68, + "confidence": 0.995 + }, + { + "text": "qui", + "start": 40.68, + "end": 40.96, + "confidence": 0.997 + }, + { + "text": "permettent", + "start": 40.96, + "end": 41.46, + "confidence": 0.997 + }, + { + "text": "de", + "start": 41.46, + "end": 41.6, + "confidence": 0.998 + }, + { + "text": "créer", + "start": 41.6, + "end": 42.06, + "confidence": 0.998 + }, + { + "text": "cet", + "start": 42.06, + "end": 42.38, + "confidence": 0.998 + }, + { + "text": "objet", + "start": 42.38, + "end": 42.6, + "confidence": 0.994 + }, + { + "text": "dont", + "start": 42.6, + "end": 42.8, + "confidence": 0.779 + }, + { + "text": "Nicolas", + "start": 42.8, + "end": 43.26, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 43.26, + "end": 43.5, + "confidence": 0.986 + }, + { + "text": "qu'il", + "start": 43.5, + "end": 43.7, + "confidence": 0.983 + }, + { + "text": "est", + "start": 43.7, + "end": 43.88, + "confidence": 0.991 + }, + { + "text": "vraisemblablement", + "start": 43.88, + "end": 44.98, + "confidence": 0.991 + }, + { + "text": "inédit", + "start": 44.98, + "end": 45.38, + "confidence": 0.98 + }, + { + "text": "dans", + "start": 
45.38, + "end": 45.7, + "confidence": 0.969 + }, + { + "text": "l'histoire", + "start": 45.7, + "end": 45.98, + "confidence": 0.957 + }, + { + "text": "de", + "start": 45.98, + "end": 46.18, + "confidence": 0.999 + }, + { + "text": "l'humanité.", + "start": 46.18, + "end": 46.54, + "confidence": 0.992 + } + ] + }, + { + "id": 10, + "seek": 2534, + "start": 46.54, + "end": 48.82, + "text": " Mais ça, ça soulève une autre interrogation.", + "tokens": [ + 6313, + 2788, + 11, + 2788, + 5133, + 31397, + 2251, + 15081, + 24871, + 399, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.969, + "words": [ + { + "text": "Mais", + "start": 46.54, + "end": 47.24, + "confidence": 0.846 + }, + { + "text": "ça,", + "start": 47.24, + "end": 47.72, + "confidence": 0.935 + }, + { + "text": "ça", + "start": 47.72, + "end": 47.76, + "confidence": 0.977 + }, + { + "text": "soulève", + "start": 47.76, + "end": 47.84, + "confidence": 0.993 + }, + { + "text": "une", + "start": 47.84, + "end": 48.02, + "confidence": 0.998 + }, + { + "text": "autre", + "start": 48.02, + "end": 48.26, + "confidence": 0.999 + }, + { + "text": "interrogation.", + "start": 48.26, + "end": 48.82, + "confidence": 0.997 + } + ] + }, + { + "id": 11, + "seek": 4884, + "start": 49.22, + "end": 55.46, + "text": " Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit?", + "tokens": [ + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 8603, + 14964, + 12703, + 294, + 7811, + 270, + 13716, + 270, + 631, + 10349, + 18018, + 1531, + 8783, + 871, + 6212, + 517, + 18018, + 294, + 7811, + 270, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.988, + "words": [ + { + "text": "Est-ce", + "start": 49.22, + "end": 49.62, + 
"confidence": 0.982 + }, + { + "text": "que", + "start": 49.62, + "end": 49.72, + "confidence": 0.991 + }, + { + "text": "le", + "start": 49.72, + "end": 49.82, + "confidence": 0.993 + }, + { + "text": "fait", + "start": 49.82, + "end": 49.98, + "confidence": 0.999 + }, + { + "text": "que", + "start": 49.98, + "end": 50.14, + "confidence": 0.991 + }, + { + "text": "cet", + "start": 50.14, + "end": 50.32, + "confidence": 0.991 + }, + { + "text": "objet", + "start": 50.32, + "end": 50.66, + "confidence": 0.997 + }, + { + "text": "soit", + "start": 50.66, + "end": 51.12, + "confidence": 0.995 + }, + { + "text": "inédit", + "start": 51.12, + "end": 51.8, + "confidence": 0.996 + }, + { + "text": "induit", + "start": 51.8, + "end": 52.32, + "confidence": 0.977 + }, + { + "text": "que", + "start": 52.32, + "end": 52.42, + "confidence": 0.983 + }, + { + "text": "notre", + "start": 52.42, + "end": 52.72, + "confidence": 0.996 + }, + { + "text": "rapport", + "start": 52.72, + "end": 53.28, + "confidence": 0.997 + }, + { + "text": "à", + "start": 53.28, + "end": 53.44, + "confidence": 0.978 + }, + { + "text": "lui", + "start": 53.44, + "end": 53.66, + "confidence": 0.999 + }, + { + "text": "est", + "start": 53.66, + "end": 54.02, + "confidence": 0.916 + }, + { + "text": "aussi", + "start": 54.02, + "end": 54.54, + "confidence": 0.995 + }, + { + "text": "un", + "start": 54.54, + "end": 54.7, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 54.7, + "end": 55.0, + "confidence": 0.996 + }, + { + "text": "inédit?", + "start": 55.0, + "end": 55.46, + "confidence": 0.996 + } + ] + }, + { + "id": 12, + "seek": 4884, + "start": 55.46, + "end": 63.12, + "text": " Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone?", + "tokens": [ + 2588, + 16389, + 1264, + 11, + 871, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 13307, + 871, + 25323, + 
1531, + 22829, + 421, + 6, + 266, + 3962, + 1147, + 1001, + 1531, + 274, + 6, + 16752, + 1111, + 25349, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.965, + "words": [ + { + "text": "Je", + "start": 55.46, + "end": 55.9, + "confidence": 0.88 + }, + { + "text": "veux", + "start": 55.9, + "end": 56.0, + "confidence": 0.988 + }, + { + "text": "dire,", + "start": 56.0, + "end": 56.24, + "confidence": 0.997 + }, + { + "text": "est-ce", + "start": 56.24, + "end": 56.36, + "confidence": 0.99 + }, + { + "text": "que", + "start": 56.36, + "end": 56.42, + "confidence": 0.99 + }, + { + "text": "le", + "start": 56.42, + "end": 56.58, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 56.58, + "end": 56.88, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 56.88, + "end": 57.04, + "confidence": 0.986 + }, + { + "text": "a", + "start": 57.04, + "end": 57.18, + "confidence": 0.989 + }, + { + "text": "au", + "start": 57.18, + "end": 57.28, + "confidence": 0.968 + }, + { + "text": "smartphone", + "start": 57.28, + "end": 57.6, + "confidence": 0.994 + }, + { + "text": "est", + "start": 57.6, + "end": 57.92, + "confidence": 0.95 + }, + { + "text": "comparable", + "start": 57.92, + "end": 58.24, + "confidence": 0.997 + }, + { + "text": "à", + "start": 58.24, + "end": 58.48, + "confidence": 0.949 + }, + { + "text": "celui", + "start": 58.48, + "end": 58.66, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 58.66, + "end": 58.9, + "confidence": 0.989 + }, + { + "text": "entretenait", + "start": 58.9, + "end": 59.32, + "confidence": 0.929 + }, + { + "text": "à", + "start": 59.32, + "end": 59.46, + "confidence": 0.958 + }, + { + "text": "d'autres", + "start": 59.46, + "end": 59.7, + "confidence": 0.997 + }, + { + "text": "objets", + "start": 59.7, + "end": 59.96, + 
"confidence": 0.991 + }, + { + "text": "techniques", + "start": 59.96, + "end": 60.46, + "confidence": 0.983 + }, + { + "text": "comme", + "start": 60.46, + "end": 60.88, + "confidence": 0.587 + }, + { + "text": "la", + "start": 60.88, + "end": 61.5, + "confidence": 0.987 + }, + { + "text": "voiture", + "start": 61.5, + "end": 62.06, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 62.06, + "end": 62.36, + "confidence": 0.945 + }, + { + "text": "le", + "start": 62.36, + "end": 62.68, + "confidence": 0.998 + }, + { + "text": "téléphone?", + "start": 62.68, + "end": 63.12, + "confidence": 0.999 + } + ] + }, + { + "id": 13, + "seek": 4884, + "start": 63.36, + "end": 66.66, + "text": " Il n'y a pas d'équivalent en fait.", + "tokens": [ + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 465, + 3887, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.936, + "words": [ + { + "text": "Il", + "start": 63.36, + "end": 65.42, + "confidence": 0.779 + }, + { + "text": "n'y", + "start": 65.42, + "end": 65.48, + "confidence": 0.978 + }, + { + "text": "a", + "start": 65.48, + "end": 65.54, + "confidence": 0.992 + }, + { + "text": "pas", + "start": 65.54, + "end": 65.66, + "confidence": 0.999 + }, + { + "text": "d'équivalent", + "start": 65.66, + "end": 66.22, + "confidence": 0.995 + }, + { + "text": "en", + "start": 66.22, + "end": 66.42, + "confidence": 0.601 + }, + { + "text": "fait.", + "start": 66.42, + "end": 66.66, + "confidence": 0.996 + } + ] + }, + { + "id": 14, + "seek": 4884, + "start": 66.88, + "end": 71.52, + "text": " Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant.", + "tokens": [ + 3790, + 5926, + 5550, + 7089, + 30236, + 368, + 11456, + 1375, + 526, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 11, + 269, + 6, + 377, + 7184, + 259, + 394, + 1030, + 
7245, + 351, + 5798, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.953, + "words": [ + { + "text": "Et", + "start": 66.88, + "end": 66.98, + "confidence": 0.599 + }, + { + "text": "donc", + "start": 66.98, + "end": 67.08, + "confidence": 0.901 + }, + { + "text": "cette", + "start": 67.08, + "end": 67.28, + "confidence": 0.71 + }, + { + "text": "espèce", + "start": 67.28, + "end": 67.54, + "confidence": 0.995 + }, + { + "text": "de", + "start": 67.54, + "end": 67.68, + "confidence": 0.999 + }, + { + "text": "nouveauté", + "start": 67.68, + "end": 68.48, + "confidence": 0.979 + }, + { + "text": "dans", + "start": 68.48, + "end": 68.66, + "confidence": 0.98 + }, + { + "text": "la", + "start": 68.66, + "end": 68.94, + "confidence": 0.995 + }, + { + "text": "relation", + "start": 68.94, + "end": 69.22, + "confidence": 0.998 + }, + { + "text": "à", + "start": 69.22, + "end": 69.38, + "confidence": 0.997 + }, + { + "text": "l'objet,", + "start": 69.38, + "end": 70.24, + "confidence": 0.997 + }, + { + "text": "c'est", + "start": 70.24, + "end": 70.38, + "confidence": 0.98 + }, + { + "text": "fascinant", + "start": 70.38, + "end": 70.64, + "confidence": 0.978 + }, + { + "text": "et", + "start": 70.64, + "end": 70.76, + "confidence": 0.964 + }, + { + "text": "terrifiant.", + "start": 70.76, + "end": 71.52, + "confidence": 0.977 + } + ] + }, + { + "id": 15, + "seek": 4884, + "start": 71.62, + "end": 76.48, + "text": " Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendants de cet objet,", + "tokens": [ + 20429, + 421, + 6, + 266, + 257, + 287, + 6, + 36107, + 11, + 5173, + 476, + 37313, + 1512, + 33643, + 25929, + 1030, + 1512, + 3328, + 11, + 274, + 6, + 9498, + 45768, + 1719, + 368, + 8603, + 14964, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 
1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.813, + "words": [ + { + "text": "Parce", + "start": 71.62, + "end": 71.86, + "confidence": 0.512 + }, + { + "text": "qu'on", + "start": 71.86, + "end": 72.12, + "confidence": 0.937 + }, + { + "text": "a", + "start": 72.12, + "end": 72.44, + "confidence": 0.982 + }, + { + "text": "l'impression,", + "start": 72.44, + "end": 73.56, + "confidence": 0.998 + }, + { + "text": "comme", + "start": 73.56, + "end": 73.84, + "confidence": 0.964 + }, + { + "text": "le", + "start": 73.84, + "end": 74.0, + "confidence": 0.984 + }, + { + "text": "disent", + "start": 74.0, + "end": 74.2, + "confidence": 0.998 + }, + { + "text": "les", + "start": 74.2, + "end": 74.4, + "confidence": 0.994 + }, + { + "text": "utilisateurs", + "start": 74.4, + "end": 74.84, + "confidence": 0.997 + }, + { + "text": "et", + "start": 74.84, + "end": 74.96, + "confidence": 0.329 + }, + { + "text": "les", + "start": 74.96, + "end": 75.0, + "confidence": 0.773 + }, + { + "text": "services,", + "start": 75.0, + "end": 75.22, + "confidence": 0.214 + }, + { + "text": "d'être", + "start": 75.22, + "end": 75.42, + "confidence": 0.766 + }, + { + "text": "dépendants", + "start": 75.42, + "end": 75.96, + "confidence": 0.789 + }, + { + "text": "de", + "start": 75.96, + "end": 76.08, + "confidence": 0.986 + }, + { + "text": "cet", + "start": 76.08, + "end": 76.26, + "confidence": 0.996 + }, + { + "text": "objet,", + "start": 76.26, + "end": 76.48, + "confidence": 0.996 + } + ] + }, + { + "id": 16, + "seek": 7684, + "start": 76.86, + "end": 83.26, + "text": " d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet.", + "tokens": [ + 274, + 6, + 471, + 43612, + 465, + 3887, + 2251, + 7089, + 30236, + 368, + 9721, + 11, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 368, + 287, + 6, + 335, + 781, + 374, + 1030, + 1956, + 669, + 18832, + 6212, + 
1531, + 730, + 1254, + 279, + 368, + 319, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.917, + "words": [ + { + "text": "d'induire", + "start": 76.86, + "end": 77.08, + "confidence": 0.841 + }, + { + "text": "en", + "start": 77.08, + "end": 77.24, + "confidence": 0.618 + }, + { + "text": "fait", + "start": 77.24, + "end": 77.34, + "confidence": 0.994 + }, + { + "text": "une", + "start": 77.34, + "end": 77.52, + "confidence": 0.983 + }, + { + "text": "espèce", + "start": 77.52, + "end": 77.88, + "confidence": 0.996 + }, + { + "text": "de", + "start": 77.88, + "end": 78.48, + "confidence": 0.997 + }, + { + "text": "relation,", + "start": 78.48, + "end": 78.6, + "confidence": 0.596 + }, + { + "text": "de", + "start": 78.6, + "end": 78.94, + "confidence": 0.987 + }, + { + "text": "médiation", + "start": 78.94, + "end": 79.52, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 79.52, + "end": 79.74, + "confidence": 0.967 + }, + { + "text": "le", + "start": 79.74, + "end": 79.92, + "confidence": 0.998 + }, + { + "text": "monde", + "start": 79.92, + "end": 80.64, + "confidence": 0.992 + }, + { + "text": "qui", + "start": 80.64, + "end": 81.1, + "confidence": 0.696 + }, + { + "text": "rend", + "start": 81.1, + "end": 81.64, + "confidence": 0.91 + }, + { + "text": "de", + "start": 81.64, + "end": 81.78, + "confidence": 0.712 + }, + { + "text": "l'ampleur", + "start": 81.78, + "end": 82.02, + "confidence": 0.987 + }, + { + "text": "et", + "start": 82.02, + "end": 82.12, + "confidence": 0.931 + }, + { + "text": "qui", + "start": 82.12, + "end": 82.24, + "confidence": 0.976 + }, + { + "text": "amène", + "start": 82.24, + "end": 82.36, + "confidence": 0.973 + }, + { + "text": "aussi", + "start": 82.36, + "end": 82.56, + "confidence": 0.938 + }, + { + "text": "à", + "start": 82.56, + "end": 82.62, + "confidence": 0.941 + }, + { + 
"text": "des", + "start": 82.62, + "end": 82.72, + "confidence": 0.992 + }, + { + "text": "formes", + "start": 82.72, + "end": 82.9, + "confidence": 0.993 + }, + { + "text": "de", + "start": 82.9, + "end": 83.02, + "confidence": 0.998 + }, + { + "text": "rejet.", + "start": 83.02, + "end": 83.26, + "confidence": 0.883 + } + ] + }, + { + "id": 17, + "seek": 7684, + "start": 83.94, + "end": 87.8, + "text": " Donc, à objet inédit, rapport inédit.", + "tokens": [ + 7477, + 11, + 1531, + 14964, + 294, + 7811, + 270, + 11, + 18018, + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.962, + "words": [ + { + "text": "Donc,", + "start": 83.94, + "end": 84.94, + "confidence": 0.971 + }, + { + "text": "à", + "start": 84.94, + "end": 84.98, + "confidence": 0.88 + }, + { + "text": "objet", + "start": 84.98, + "end": 85.36, + "confidence": 0.828 + }, + { + "text": "inédit,", + "start": 85.36, + "end": 86.56, + "confidence": 0.993 + }, + { + "text": "rapport", + "start": 86.56, + "end": 87.0, + "confidence": 0.981 + }, + { + "text": "inédit.", + "start": 87.0, + "end": 87.8, + "confidence": 0.998 + } + ] + }, + { + "id": 18, + "seek": 7684, + "start": 88.02, + "end": 95.14, + "text": " Et ce rapport, si j'en crois Nicolas, serait caractérisé par un mélange de dépendance et de rejet.", + "tokens": [ + 3790, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 21724, + 38268, + 11, + 23139, + 1032, + 578, + 4198, + 22118, + 971, + 517, + 41953, + 933, + 368, + 45768, + 719, + 1030, + 368, + 319, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.972, + "words": [ + { + "text": "Et", + "start": 88.02, + "end": 88.48, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 88.48, + "end": 88.86, + "confidence": 
0.975 + }, + { + "text": "rapport,", + "start": 88.86, + "end": 89.28, + "confidence": 0.998 + }, + { + "text": "si", + "start": 89.28, + "end": 89.56, + "confidence": 0.999 + }, + { + "text": "j'en", + "start": 89.56, + "end": 89.84, + "confidence": 0.996 + }, + { + "text": "crois", + "start": 89.84, + "end": 89.88, + "confidence": 0.984 + }, + { + "text": "Nicolas,", + "start": 89.88, + "end": 90.54, + "confidence": 0.681 + }, + { + "text": "serait", + "start": 90.54, + "end": 90.94, + "confidence": 0.885 + }, + { + "text": "caractérisé", + "start": 90.94, + "end": 91.8, + "confidence": 0.993 + }, + { + "text": "par", + "start": 91.8, + "end": 92.12, + "confidence": 0.997 + }, + { + "text": "un", + "start": 92.12, + "end": 92.44, + "confidence": 0.997 + }, + { + "text": "mélange", + "start": 92.44, + "end": 92.98, + "confidence": 0.999 + }, + { + "text": "de", + "start": 92.98, + "end": 93.4, + "confidence": 0.998 + }, + { + "text": "dépendance", + "start": 93.4, + "end": 94.24, + "confidence": 0.953 + }, + { + "text": "et", + "start": 94.24, + "end": 94.54, + "confidence": 0.998 + }, + { + "text": "de", + "start": 94.54, + "end": 94.68, + "confidence": 0.999 + }, + { + "text": "rejet.", + "start": 94.68, + "end": 95.14, + "confidence": 0.993 + } + ] + }, + { + "id": 19, + "seek": 7684, + "start": 95.78, + "end": 102.86, + "text": " Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies", + "tokens": [ + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 5732, + 962, + 1712, + 14953, + 287, + 6, + 29093, + 730, + 1111, + 25349, + 7512, + 1030, + 368, + 9580, + 8969, + 313, + 2680, + 3269, + 371, + 530 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.941, + "words": [ + { + "text": "Bon,", + "start": 95.78, + "end": 96.38, + "confidence": 
0.792 + }, + { + "text": "en", + "start": 96.38, + "end": 96.52, + "confidence": 0.998 + }, + { + "text": "vrai,", + "start": 96.52, + "end": 97.14, + "confidence": 0.994 + }, + { + "text": "il", + "start": 97.14, + "end": 97.18, + "confidence": 0.998 + }, + { + "text": "faudrait", + "start": 97.18, + "end": 97.58, + "confidence": 0.997 + }, + { + "text": "remonter", + "start": 97.58, + "end": 98.08, + "confidence": 0.997 + }, + { + "text": "très", + "start": 98.08, + "end": 98.6, + "confidence": 0.997 + }, + { + "text": "très", + "start": 98.6, + "end": 98.7, + "confidence": 0.768 + }, + { + "text": "finement", + "start": 98.7, + "end": 99.32, + "confidence": 0.849 + }, + { + "text": "toute", + "start": 99.32, + "end": 99.7, + "confidence": 0.984 + }, + { + "text": "l'histoire", + "start": 99.7, + "end": 100.06, + "confidence": 0.997 + }, + { + "text": "des", + "start": 100.06, + "end": 100.24, + "confidence": 0.998 + }, + { + "text": "objets", + "start": 100.24, + "end": 100.48, + "confidence": 0.999 + }, + { + "text": "techniques", + "start": 100.48, + "end": 101.02, + "confidence": 0.984 + }, + { + "text": "et", + "start": 101.02, + "end": 101.48, + "confidence": 0.527 + }, + { + "text": "de", + "start": 101.48, + "end": 101.68, + "confidence": 0.994 + }, + { + "text": "leur", + "start": 101.68, + "end": 101.84, + "confidence": 0.833 + }, + { + "text": "insertion", + "start": 101.84, + "end": 102.32, + "confidence": 0.994 + }, + { + "text": "dans", + "start": 102.32, + "end": 102.48, + "confidence": 0.99 + }, + { + "text": "nos", + "start": 102.48, + "end": 102.66, + "confidence": 0.998 + }, + { + "text": "vies", + "start": 102.66, + "end": 102.86, + "confidence": 0.998 + } + ] + }, + { + "id": 20, + "seek": 7684, + "start": 102.9, + "end": 105.74, + "text": " pour déterminer si ce rapport est totalement inédit.", + "tokens": [ + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203, + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + 
"avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.981, + "words": [ + { + "text": "pour", + "start": 102.9, + "end": 103.06, + "confidence": 0.822 + }, + { + "text": "déterminer", + "start": 103.06, + "end": 103.66, + "confidence": 0.997 + }, + { + "text": "si", + "start": 103.66, + "end": 103.76, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 103.76, + "end": 103.94, + "confidence": 0.997 + }, + { + "text": "rapport", + "start": 103.94, + "end": 104.26, + "confidence": 0.997 + }, + { + "text": "est", + "start": 104.26, + "end": 104.74, + "confidence": 0.998 + }, + { + "text": "totalement", + "start": 104.74, + "end": 105.3, + "confidence": 0.999 + }, + { + "text": "inédit.", + "start": 105.3, + "end": 105.74, + "confidence": 0.999 + } + ] + }, + { + "id": 21, + "seek": 10584, + "start": 106.1, + "end": 109.34, + "text": " Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment.", + "tokens": [ + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 408, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.94, + "words": [ + { + "text": "Mais", + "start": 106.1, + "end": 106.36, + "confidence": 0.947 + }, + { + "text": "j'ai", + "start": 106.36, + "end": 106.92, + "confidence": 0.941 + }, + { + "text": "l'impression", + "start": 106.92, + "end": 107.36, + "confidence": 0.996 + }, + { + "text": "comme", + "start": 107.36, + "end": 107.56, + "confidence": 0.641 + }, + { + "text": "ça", + "start": 107.56, + "end": 107.82, + "confidence": 0.978 + }, + { + "text": "que", + "start": 107.82, + "end": 107.96, + "confidence": 0.976 + }, + { + "text": "Nicolas", + "start": 107.96, + "end": 108.46, + "confidence": 0.985 + }, + { + "text": "ne", + "start": 108.46, + "end": 
108.66, + "confidence": 0.726 + }, + { + "text": "se", + "start": 108.66, + "end": 108.7, + "confidence": 0.991 + }, + { + "text": "trompe", + "start": 108.7, + "end": 108.88, + "confidence": 0.995 + }, + { + "text": "pas", + "start": 108.88, + "end": 109.08, + "confidence": 0.999 + }, + { + "text": "vraiment.", + "start": 109.08, + "end": 109.34, + "confidence": 0.991 + } + ] + }, + { + "id": 22, + "seek": 10584, + "start": 109.88, + "end": 114.98, + "text": " Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone.", + "tokens": [ + 8732, + 34081, + 631, + 1506, + 262, + 6000, + 11, + 1930, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698, + 1581, + 47159, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.969, + "words": [ + { + "text": "Pour", + "start": 109.88, + "end": 110.08, + "confidence": 0.997 + }, + { + "text": "autant", + "start": 110.08, + "end": 110.24, + "confidence": 1.0 + }, + { + "text": "que", + "start": 110.24, + "end": 110.42, + "confidence": 0.988 + }, + { + "text": "je", + "start": 110.42, + "end": 110.52, + "confidence": 0.998 + }, + { + "text": "sache,", + "start": 110.52, + "end": 111.14, + "confidence": 0.963 + }, + { + "text": "il", + "start": 111.14, + "end": 111.18, + "confidence": 0.997 + }, + { + "text": "y", + "start": 111.18, + "end": 111.32, + "confidence": 0.992 + }, + { + "text": "a", + "start": 111.32, + "end": 111.36, + "confidence": 0.993 + }, + { + "text": "eu", + "start": 111.36, + "end": 111.68, + "confidence": 0.998 + }, + { + "text": "plein", + "start": 111.68, + "end": 111.88, + "confidence": 0.974 + }, + { + "text": "de", + "start": 111.88, + "end": 112.06, + "confidence": 0.997 + }, + { + "text": "discussions", + "start": 112.06, + "end": 112.6, + "confidence": 0.799 + }, + { + "text": "autour", + "start": 
112.6, + "end": 112.94, + "confidence": 0.995 + }, + { + "text": "de", + "start": 112.94, + "end": 113.46, + "confidence": 0.997 + }, + { + "text": "la", + "start": 113.46, + "end": 113.52, + "confidence": 0.998 + }, + { + "text": "voiture", + "start": 113.52, + "end": 113.86, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 113.86, + "end": 114.06, + "confidence": 0.765 + }, + { + "text": "même", + "start": 114.06, + "end": 114.44, + "confidence": 0.996 + }, + { + "text": "du", + "start": 114.44, + "end": 114.6, + "confidence": 0.995 + }, + { + "text": "téléphone.", + "start": 114.6, + "end": 114.98, + "confidence": 0.999 + } + ] + }, + { + "id": 23, + "seek": 10584, + "start": 115.34, + "end": 119.84, + "text": " Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre.", + "tokens": [ + 6313, + 635, + 45768, + 719, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13, + 7477, + 476, + 319, + 7108, + 2107, + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.972, + "words": [ + { + "text": "Mais", + "start": 115.34, + "end": 115.72, + "confidence": 0.994 + }, + { + "text": "la", + "start": 115.72, + "end": 116.02, + "confidence": 0.937 + }, + { + "text": "dépendance", + "start": 116.02, + "end": 116.4, + "confidence": 0.997 + }, + { + "text": "n'était", + "start": 116.4, + "end": 116.62, + "confidence": 0.994 + }, + { + "text": "pas", + "start": 116.62, + "end": 117.0, + "confidence": 0.998 + }, + { + "text": "du", + "start": 117.0, + "end": 117.16, + "confidence": 0.995 + }, + { + "text": "même", + "start": 117.16, + "end": 117.46, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 117.46, + "end": 117.78, + "confidence": 0.999 + }, + { + "text": "Donc", + "start": 117.78, + "end": 117.98, + "confidence": 0.804 + 
}, + { + "text": "le", + "start": 117.98, + "end": 118.34, + "confidence": 0.715 + }, + { + "text": "rejet", + "start": 118.34, + "end": 118.62, + "confidence": 0.999 + }, + { + "text": "non", + "start": 118.62, + "end": 118.78, + "confidence": 0.975 + }, + { + "text": "plus", + "start": 118.78, + "end": 118.94, + "confidence": 0.996 + }, + { + "text": "n'était", + "start": 118.94, + "end": 119.12, + "confidence": 0.987 + }, + { + "text": "pas", + "start": 119.12, + "end": 119.3, + "confidence": 0.998 + }, + { + "text": "du", + "start": 119.3, + "end": 119.38, + "confidence": 0.995 + }, + { + "text": "même", + "start": 119.38, + "end": 119.56, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 119.56, + "end": 119.84, + "confidence": 0.999 + } + ] + }, + { + "id": 24, + "seek": 10584, + "start": 119.98, + "end": 123.02, + "text": " On peut adorer sa bagnole, en avoir besoin pour plein de choses.", + "tokens": [ + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 1771, + 306, + 11, + 465, + 10853, + 19207, + 2016, + 21088, + 368, + 14488, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.991, + "words": [ + { + "text": "On", + "start": 119.98, + "end": 120.18, + "confidence": 0.996 + }, + { + "text": "peut", + "start": 120.18, + "end": 120.38, + "confidence": 0.997 + }, + { + "text": "adorer", + "start": 120.38, + "end": 120.66, + "confidence": 0.99 + }, + { + "text": "sa", + "start": 120.66, + "end": 120.88, + "confidence": 0.985 + }, + { + "text": "bagnole,", + "start": 120.88, + "end": 121.46, + "confidence": 0.984 + }, + { + "text": "en", + "start": 121.46, + "end": 121.56, + "confidence": 0.989 + }, + { + "text": "avoir", + "start": 121.56, + "end": 121.74, + "confidence": 0.998 + }, + { + "text": "besoin", + "start": 121.74, + "end": 122.1, + "confidence": 0.999 + }, + { + "text": "pour", + "start": 122.1, + "end": 122.34, + 
"confidence": 0.987 + }, + { + "text": "plein", + "start": 122.34, + "end": 122.68, + "confidence": 0.989 + }, + { + "text": "de", + "start": 122.68, + "end": 122.8, + "confidence": 0.998 + }, + { + "text": "choses.", + "start": 122.8, + "end": 123.02, + "confidence": 0.989 + } + ] + }, + { + "id": 25, + "seek": 10584, + "start": 123.28, + "end": 126.36, + "text": " Et bien, le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 3790, + 3610, + 11, + 476, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.895, + "words": [ + { + "text": "Et", + "start": 123.28, + "end": 123.46, + "confidence": 0.667 + }, + { + "text": "bien,", + "start": 123.46, + "end": 123.86, + "confidence": 0.469 + }, + { + "text": "le", + "start": 123.86, + "end": 123.98, + "confidence": 0.996 + }, + { + "text": "soir,", + "start": 123.98, + "end": 124.68, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 124.68, + "end": 124.9, + "confidence": 0.997 + }, + { + "text": "on", + "start": 124.9, + "end": 125.02, + "confidence": 0.998 + }, + { + "text": "va", + "start": 125.02, + "end": 125.14, + "confidence": 0.996 + }, + { + "text": "se", + "start": 125.14, + "end": 125.38, + "confidence": 0.988 + }, + { + "text": "coucher,", + "start": 125.38, + "end": 125.8, + "confidence": 0.987 + }, + { + "text": "on", + "start": 125.8, + "end": 126.02, + "confidence": 0.995 + }, + { + "text": "la", + "start": 126.02, + "end": 126.22, + "confidence": 0.802 + }, + { + "text": "laisse.", + "start": 126.22, + "end": 126.36, + "confidence": 0.999 + } + ] + }, + { + "id": 26, + "seek": 10584, + "start": 126.98, + "end": 130.48, + "text": " On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes.", + "tokens": [ + 1282, + 408, + 287, + 6, + 64, + 1736, + 2680, + 
635, + 2135, + 6932, + 322, + 871, + 1609, + 7997, + 11, + 322, + 408, + 287, + 6, + 443, + 76, + 18832, + 1736, + 1609, + 13228, + 1521, + 279, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.914, + "words": [ + { + "text": "On", + "start": 126.98, + "end": 127.32, + "confidence": 0.954 + }, + { + "text": "ne", + "start": 127.32, + "end": 127.36, + "confidence": 0.803 + }, + { + "text": "l'a", + "start": 127.36, + "end": 127.48, + "confidence": 0.974 + }, + { + "text": "pas", + "start": 127.48, + "end": 127.68, + "confidence": 0.999 + }, + { + "text": "dans", + "start": 127.68, + "end": 127.8, + "confidence": 0.996 + }, + { + "text": "la", + "start": 127.8, + "end": 128.06, + "confidence": 0.994 + }, + { + "text": "main", + "start": 128.06, + "end": 128.26, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 128.26, + "end": 128.44, + "confidence": 0.935 + }, + { + "text": "on", + "start": 128.44, + "end": 128.62, + "confidence": 0.997 + }, + { + "text": "est", + "start": 128.62, + "end": 128.68, + "confidence": 0.993 + }, + { + "text": "au", + "start": 128.68, + "end": 129.04, + "confidence": 0.984 + }, + { + "text": "lit,", + "start": 129.04, + "end": 129.14, + "confidence": 0.999 + }, + { + "text": "on", + "start": 129.14, + "end": 129.26, + "confidence": 0.427 + }, + { + "text": "ne", + "start": 129.26, + "end": 129.3, + "confidence": 0.963 + }, + { + "text": "l'emmène", + "start": 129.3, + "end": 129.5, + "confidence": 0.992 + }, + { + "text": "pas", + "start": 129.5, + "end": 129.68, + "confidence": 0.997 + }, + { + "text": "au", + "start": 129.68, + "end": 129.86, + "confidence": 0.674 + }, + { + "text": "chiottes.", + "start": 129.86, + "end": 130.48, + "confidence": 0.828 + } + ] + }, + { + "id": 27, + "seek": 13084, + "start": 130.86, + "end": 136.9, + "text": " On pouvait être énervé par son môme qui occupait la ligne de 
téléphone pendant une heure chaque soir pour discuter avec un copain.", + "tokens": [ + 1282, + 45913, + 7418, + 45045, + 15797, + 971, + 1872, + 275, + 2851, + 1398, + 1956, + 8073, + 1001, + 635, + 34207, + 368, + 47159, + 17338, + 2251, + 30027, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.955, + "words": [ + { + "text": "On", + "start": 130.86, + "end": 131.04, + "confidence": 0.983 + }, + { + "text": "pouvait", + "start": 131.04, + "end": 131.28, + "confidence": 0.989 + }, + { + "text": "être", + "start": 131.28, + "end": 131.48, + "confidence": 0.996 + }, + { + "text": "énervé", + "start": 131.48, + "end": 132.22, + "confidence": 0.906 + }, + { + "text": "par", + "start": 132.22, + "end": 132.44, + "confidence": 0.991 + }, + { + "text": "son", + "start": 132.44, + "end": 132.7, + "confidence": 0.998 + }, + { + "text": "môme", + "start": 132.7, + "end": 133.1, + "confidence": 0.832 + }, + { + "text": "qui", + "start": 133.1, + "end": 133.34, + "confidence": 0.919 + }, + { + "text": "occupait", + "start": 133.34, + "end": 133.76, + "confidence": 0.991 + }, + { + "text": "la", + "start": 133.76, + "end": 133.8, + "confidence": 0.992 + }, + { + "text": "ligne", + "start": 133.8, + "end": 134.08, + "confidence": 0.999 + }, + { + "text": "de", + "start": 134.08, + "end": 134.14, + "confidence": 0.997 + }, + { + "text": "téléphone", + "start": 134.14, + "end": 134.6, + "confidence": 0.985 + }, + { + "text": "pendant", + "start": 134.6, + "end": 134.82, + "confidence": 0.981 + }, + { + "text": "une", + "start": 134.82, + "end": 135.2, + "confidence": 0.87 + }, + { + "text": "heure", + "start": 135.2, + "end": 135.36, + "confidence": 0.998 + }, + { + "text": "chaque", + "start": 135.36, + "end": 135.54, + "confidence": 0.991 + }, + { + "text": "soir", + "start": 
135.54, + "end": 135.8, + "confidence": 0.996 + }, + { + "text": "pour", + "start": 135.8, + "end": 135.96, + "confidence": 0.79 + }, + { + "text": "discuter", + "start": 135.96, + "end": 136.28, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 136.28, + "end": 136.48, + "confidence": 0.996 + }, + { + "text": "un", + "start": 136.48, + "end": 136.6, + "confidence": 0.999 + }, + { + "text": "copain.", + "start": 136.6, + "end": 136.9, + "confidence": 0.998 + } + ] + }, + { + "id": 28, + "seek": 13084, + "start": 137.28, + "end": 141.88, + "text": " Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui,", + "tokens": [ + 6313, + 2788, + 408, + 725, + 15750, + 35235, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 1769, + 5698, + 275, + 2851, + 1398, + 14023, + 6, + 10556, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.959, + "words": [ + { + "text": "Mais", + "start": 137.28, + "end": 137.46, + "confidence": 0.993 + }, + { + "text": "ça", + "start": 137.46, + "end": 137.68, + "confidence": 0.938 + }, + { + "text": "ne", + "start": 137.68, + "end": 137.94, + "confidence": 0.998 + }, + { + "text": "ressemblait", + "start": 137.94, + "end": 138.4, + "confidence": 0.991 + }, + { + "text": "pas", + "start": 138.4, + "end": 138.76, + "confidence": 0.995 + }, + { + "text": "à", + "start": 138.76, + "end": 138.94, + "confidence": 0.988 + }, + { + "text": "ce", + "start": 138.94, + "end": 138.98, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 138.98, + "end": 139.1, + "confidence": 0.986 + }, + { + "text": "peut", + "start": 139.1, + "end": 139.48, + "confidence": 0.988 + }, + { + "text": "ressentir", + "start": 139.48, + "end": 140.12, + "confidence": 0.997 + }, + { + "text": "à", + "start": 140.12, + "end": 140.32, + "confidence": 0.498 + }, + { + 
"text": "voir", + "start": 140.32, + "end": 140.46, + "confidence": 0.855 + }, + { + "text": "ce", + "start": 140.46, + "end": 140.68, + "confidence": 0.989 + }, + { + "text": "même", + "start": 140.68, + "end": 140.94, + "confidence": 0.984 + }, + { + "text": "môme", + "start": 140.94, + "end": 141.34, + "confidence": 0.998 + }, + { + "text": "aujourd'hui,", + "start": 141.34, + "end": 141.88, + "confidence": 0.988 + } + ] + }, + { + "id": 29, + "seek": 13084, + "start": 142.14, + "end": 146.3, + "text": " continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe,", + "tokens": [ + 2354, + 285, + 1712, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 5173, + 1511, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 15165, + 49523, + 454, + 391, + 716, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.963, + "words": [ + { + "text": "continuellement", + "start": 142.14, + "end": 142.94, + "confidence": 0.971 + }, + { + "text": "avec", + "start": 142.94, + "end": 143.18, + "confidence": 0.805 + }, + { + "text": "son", + "start": 143.18, + "end": 143.38, + "confidence": 0.995 + }, + { + "text": "smartphone", + "start": 143.38, + "end": 143.76, + "confidence": 0.978 + }, + { + "text": "dans", + "start": 143.76, + "end": 143.94, + "confidence": 0.979 + }, + { + "text": "la", + "start": 143.94, + "end": 144.0, + "confidence": 0.996 + }, + { + "text": "main,", + "start": 144.0, + "end": 144.36, + "confidence": 0.998 + }, + { + "text": "comme", + "start": 144.36, + "end": 144.52, + "confidence": 0.835 + }, + { + "text": "si", + "start": 144.52, + "end": 144.64, + "confidence": 0.975 + }, + { + "text": "c'était", + "start": 144.64, + "end": 144.82, + "confidence": 0.991 + }, + { + "text": "une", + "start": 144.82, + "end": 145.06, + "confidence": 0.989 + }, + { + "text": "sorte", + "start": 145.06, + "end": 
145.22, + "confidence": 0.997 + }, + { + "text": "de", + "start": 145.22, + "end": 145.3, + "confidence": 0.982 + }, + { + "text": "pacemaker", + "start": 145.3, + "end": 145.82, + "confidence": 0.917 + }, + { + "text": "externe,", + "start": 145.82, + "end": 146.3, + "confidence": 0.992 + } + ] + }, + { + "id": 30, + "seek": 13084, + "start": 146.34, + "end": 148.84, + "text": " comme si le lâcher allait entraîner sa mort immédiate.", + "tokens": [ + 5173, + 1511, + 476, + 48835, + 6759, + 439, + 1001, + 22284, + 7517, + 1193, + 601, + 6599, + 3397, + 526, + 4504, + 473, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.989, + "words": [ + { + "text": "comme", + "start": 146.34, + "end": 146.58, + "confidence": 0.996 + }, + { + "text": "si", + "start": 146.58, + "end": 146.76, + "confidence": 0.994 + }, + { + "text": "le", + "start": 146.76, + "end": 146.84, + "confidence": 0.997 + }, + { + "text": "lâcher", + "start": 146.84, + "end": 147.36, + "confidence": 0.969 + }, + { + "text": "allait", + "start": 147.36, + "end": 147.56, + "confidence": 0.993 + }, + { + "text": "entraîner", + "start": 147.56, + "end": 147.86, + "confidence": 0.978 + }, + { + "text": "sa", + "start": 147.86, + "end": 148.0, + "confidence": 0.999 + }, + { + "text": "mort", + "start": 148.0, + "end": 148.22, + "confidence": 0.998 + }, + { + "text": "immédiate.", + "start": 148.22, + "end": 148.84, + "confidence": 0.997 + } + ] + }, + { + "id": 31, + "seek": 13084, + "start": 149.04, + "end": 151.96, + "text": " Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi.", + "tokens": [ + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 2851, + 1398, + 11, + 2420, + 269, + 6, + 377, + 24724, + 1323, + 712, + 2016, + 4666, + 6212, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + 
"no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.974, + "words": [ + { + "text": "Bon,", + "start": 149.04, + "end": 149.28, + "confidence": 0.918 + }, + { + "text": "je", + "start": 149.28, + "end": 149.32, + "confidence": 0.934 + }, + { + "text": "dis", + "start": 149.32, + "end": 149.46, + "confidence": 0.988 + }, + { + "text": "ça", + "start": 149.46, + "end": 149.64, + "confidence": 0.994 + }, + { + "text": "pour", + "start": 149.64, + "end": 149.74, + "confidence": 0.997 + }, + { + "text": "le", + "start": 149.74, + "end": 149.88, + "confidence": 0.995 + }, + { + "text": "môme,", + "start": 149.88, + "end": 150.32, + "confidence": 0.998 + }, + { + "text": "mais", + "start": 150.32, + "end": 150.52, + "confidence": 0.791 + }, + { + "text": "c'est", + "start": 150.52, + "end": 150.82, + "confidence": 0.981 + }, + { + "text": "évidemment", + "start": 150.82, + "end": 151.14, + "confidence": 0.98 + }, + { + "text": "valable", + "start": 151.14, + "end": 151.48, + "confidence": 0.998 + }, + { + "text": "pour", + "start": 151.48, + "end": 151.62, + "confidence": 0.997 + }, + { + "text": "nous", + "start": 151.62, + "end": 151.76, + "confidence": 0.999 + }, + { + "text": "aussi.", + "start": 151.76, + "end": 151.96, + "confidence": 0.996 + } + ] + }, + { + "id": 32, + "seek": 13084, + "start": 152.34, + "end": 158.22, + "text": " Donc, rapport inédit. D'accord. 
Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais?", + "tokens": [ + 7477, + 11, + 18018, + 294, + 7811, + 270, + 13, + 413, + 6, + 19947, + 13, + 6313, + 19934, + 257, + 12, + 83, + 12, + 266, + 287, + 6, + 36107, + 421, + 6, + 266, + 297, + 6, + 268, + 1333, + 4271, + 14540, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.948, + "words": [ + { + "text": "Donc,", + "start": 152.34, + "end": 153.46, + "confidence": 0.991 + }, + { + "text": "rapport", + "start": 153.46, + "end": 153.66, + "confidence": 0.976 + }, + { + "text": "inédit.", + "start": 153.66, + "end": 154.24, + "confidence": 0.996 + }, + { + "text": "D'accord.", + "start": 154.24, + "end": 155.48, + "confidence": 0.978 + }, + { + "text": "Mais", + "start": 155.48, + "end": 155.82, + "confidence": 0.557 + }, + { + "text": "pourquoi", + "start": 155.82, + "end": 156.32, + "confidence": 0.994 + }, + { + "text": "a-t-on", + "start": 156.32, + "end": 156.68, + "confidence": 0.94 + }, + { + "text": "l'impression", + "start": 156.68, + "end": 157.06, + "confidence": 0.999 + }, + { + "text": "qu'on", + "start": 157.06, + "end": 157.26, + "confidence": 0.995 + }, + { + "text": "n'en", + "start": 157.26, + "end": 157.44, + "confidence": 0.878 + }, + { + "text": "sortira", + "start": 157.44, + "end": 157.9, + "confidence": 0.989 + }, + { + "text": "jamais?", + "start": 157.9, + "end": 158.22, + "confidence": 0.998 + } + ] + }, + { + "id": 33, + "seek": 15884, + "start": 158.86, + "end": 165.32, + "text": " Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux?", + "tokens": [ + 4410, + 12, + 384, + 421, + 6, + 388, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 8603, + 484, + 388, + 3551, + 303, + 3409, + 2449, + 1030, + 1026, + 
14923, + 1925, + 11, + 1030, + 1026, + 14923, + 1925, + 6992, + 631, + 3551, + 303, + 3409, + 2449, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.079788723507443, + "compression_ratio": 1.6517857142857142, + "no_speech_prob": 5.4980162531137466e-05, + "confidence": 0.962, + "words": [ + { + "text": "Est-ce", + "start": 158.86, + "end": 159.34, + "confidence": 0.981 + }, + { + "text": "qu'il", + "start": 159.34, + "end": 159.46, + "confidence": 0.997 + }, + { + "text": "faut", + "start": 159.46, + "end": 159.62, + "confidence": 0.999 + }, + { + "text": "en", + "start": 159.62, + "end": 159.78, + "confidence": 0.97 + }, + { + "text": "remettre", + "start": 159.78, + "end": 160.12, + "confidence": 0.999 + }, + { + "text": "la", + "start": 160.12, + "end": 160.34, + "confidence": 0.998 + }, + { + "text": "faute", + "start": 160.34, + "end": 160.66, + "confidence": 0.986 + }, + { + "text": "sur", + "start": 160.66, + "end": 160.94, + "confidence": 0.995 + }, + { + "text": "les", + "start": 160.94, + "end": 161.28, + "confidence": 0.995 + }, + { + "text": "gens", + "start": 161.28, + "end": 161.44, + "confidence": 1.0 + }, + { + "text": "qui", + "start": 161.44, + "end": 161.58, + "confidence": 0.984 + }, + { + "text": "ont", + "start": 161.58, + "end": 161.72, + "confidence": 0.998 + }, + { + "text": "créé", + "start": 161.72, + "end": 162.3, + "confidence": 0.99 + }, + { + "text": "cet", + "start": 162.3, + "end": 162.46, + "confidence": 0.852 + }, + { + "text": "outil", + "start": 162.46, + "end": 162.78, + "confidence": 0.99 + }, + { + "text": "merveilleux", + "start": 162.78, + "end": 163.34, + "confidence": 0.994 + }, + { + "text": "et", + "start": 163.34, + "end": 163.5, + "confidence": 0.954 + }, + { + "text": "diabolique,", + "start": 163.5, + "end": 163.86, + "confidence": 0.992 + }, + { + "text": "et", + "start": 163.86, + "end": 163.92, + "confidence": 0.54 + }, + { + "text": "diabolique", + "start": 163.92, + "end": 164.4, + "confidence": 0.951 + }, 
+ { + "text": "parce", + "start": 164.4, + "end": 164.66, + "confidence": 0.703 + }, + { + "text": "que", + "start": 164.66, + "end": 164.84, + "confidence": 0.99 + }, + { + "text": "merveilleux?", + "start": 164.84, + "end": 165.32, + "confidence": 0.997 + } + ] + }, + { + "id": 34, + "seek": 15884, + "start": 166.34, + "end": 168.82, + "text": " Les économistes parlent de dépendance du sentier.", + "tokens": [ + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 2279, + 811, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.079788723507443, + "compression_ratio": 1.6517857142857142, + "no_speech_prob": 5.4980162531137466e-05, + "confidence": 0.984, + "words": [ + { + "text": "Les", + "start": 166.34, + "end": 167.04, + "confidence": 0.926 + }, + { + "text": "économistes", + "start": 167.04, + "end": 167.48, + "confidence": 0.998 + }, + { + "text": "parlent", + "start": 167.48, + "end": 167.68, + "confidence": 0.995 + }, + { + "text": "de", + "start": 167.68, + "end": 167.82, + "confidence": 0.995 + }, + { + "text": "dépendance", + "start": 167.82, + "end": 168.36, + "confidence": 0.985 + }, + { + "text": "du", + "start": 168.36, + "end": 168.5, + "confidence": 0.997 + }, + { + "text": "sentier.", + "start": 168.5, + "end": 168.82, + "confidence": 0.978 + } + ] + }, + { + "id": 35, + "seek": 16884, + "start": 168.86, + "end": 177.42, + "text": " C'est l'idée qu'on est sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "tokens": [ + 50364, + 383, + 6, + 377, + 287, + 6, + 34281, + 421, + 6, + 266, + 871, + 1022, + 517, + 2279, + 811, + 1956, + 257, + 8862, + 4823, + 455, + 2081, + 11, + 12703, + 40005, + 9020, + 518, + 465, + 8368, + 394, + 30677, + 11, + 12703, + 465, + 40763, + 29492, + 730, + 4232, + 279, + 11, + 465, + 40763, + 29492, + 2251, + 6358, + 42379, + 13, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.10415018598238628, + 
"compression_ratio": 1.3916666666666666, + "no_speech_prob": 3.958350498578511e-05, + "confidence": 0.93, + "words": [ + { + "text": "C'est", + "start": 168.86, + "end": 169.1, + "confidence": 0.952 + }, + { + "text": "l'idée", + "start": 169.1, + "end": 169.34, + "confidence": 0.992 + }, + { + "text": "qu'on", + "start": 169.34, + "end": 169.7, + "confidence": 0.825 + }, + { + "text": "est", + "start": 169.7, + "end": 169.88, + "confidence": 0.631 + }, + { + "text": "sur", + "start": 169.88, + "end": 170.0, + "confidence": 0.993 + }, + { + "text": "un", + "start": 170.0, + "end": 170.54, + "confidence": 0.998 + }, + { + "text": "sentier", + "start": 170.54, + "end": 170.78, + "confidence": 0.99 + }, + { + "text": "qui", + "start": 170.78, + "end": 170.84, + "confidence": 0.961 + }, + { + "text": "a", + "start": 170.84, + "end": 170.94, + "confidence": 0.98 + }, + { + "text": "été", + "start": 170.94, + "end": 171.12, + "confidence": 0.996 + }, + { + "text": "établi,", + "start": 171.12, + "end": 171.9, + "confidence": 0.995 + }, + { + "text": "soit", + "start": 171.9, + "end": 172.12, + "confidence": 0.989 + }, + { + "text": "volontairement", + "start": 172.12, + "end": 172.72, + "confidence": 0.965 + }, + { + "text": "en", + "start": 172.72, + "end": 172.8, + "confidence": 0.941 + }, + { + "text": "marchant", + "start": 172.8, + "end": 173.06, + "confidence": 0.997 + }, + { + "text": "dessus,", + "start": 173.06, + "end": 174.24, + "confidence": 0.972 + }, + { + "text": "soit", + "start": 174.24, + "end": 174.92, + "confidence": 0.996 + }, + { + "text": "en", + "start": 174.92, + "end": 175.36, + "confidence": 0.991 + }, + { + "text": "définissant", + "start": 175.36, + "end": 175.5, + "confidence": 0.983 + }, + { + "text": "des", + "start": 175.5, + "end": 175.76, + "confidence": 0.984 + }, + { + "text": "bornes,", + "start": 175.76, + "end": 176.04, + "confidence": 0.975 + }, + { + "text": "en", + "start": 176.04, + "end": 176.08, + "confidence": 0.68 + }, + { 
+ "text": "définissant", + "start": 176.08, + "end": 176.58, + "confidence": 0.997 + }, + { + "text": "une", + "start": 176.58, + "end": 176.82, + "confidence": 0.944 + }, + { + "text": "signalétique.", + "start": 176.82, + "end": 177.42, + "confidence": 0.642 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_auto/bonjour.wav.words.json b/tests/expected/medium_auto/bonjour.wav.words.json new file mode 100644 index 0000000000000000000000000000000000000000..da3af389c96084e047ab79e6e6e78b0436b0bff3 --- /dev/null +++ b/tests/expected/medium_auto/bonjour.wav.words.json @@ -0,0 +1,133 @@ +{ + "text": " Bonjour !", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.14, + "end": 0.94, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50402 + ], + "temperature": 0.0, + "avg_logprob": -0.7046648502349854, + "compression_ratio": 0.5294117647058824, + "no_speech_prob": 0.08610370755195618, + "confidence": 0.964, + "words": [ + { + "text": "Bonjour !", + "start": 0.14, + "end": 0.94, + "confidence": 0.964 + } + ] + } + ], + "language": "fr", + "language_probs": { + "en": 0.010910450480878353, + "zh": 0.009780064225196838, + "de": 0.0010308112250640988, + "es": 0.00041648533078841865, + "ru": 0.0012629760894924402, + "ko": 0.0024727871641516685, + "fr": 0.9519104361534119, + "ja": 0.003029722487553954, + "pt": 0.007736667525023222, + "tr": 0.00019368366338312626, + "pl": 0.0013871078845113516, + "ca": 8.248044650827069e-06, + "nl": 0.0005183243192732334, + "ar": 0.0015965515049174428, + "sv": 0.00013311671500559896, + "it": 0.0024727871641516685, + "id": 7.948761049192399e-05, + "hi": 0.00010696228127926588, + "fi": 1.1814779099950101e-05, + "vi": 0.00038518596556968987, + "he": 7.351402746280655e-05, + "uk": 3.112779450020753e-05, + "el": 0.0002486947341822088, + "ms": 0.0003095056163147092, + "cs": 2.621223575260956e-05, + "ro": 4.9742080591386184e-05, + "da": 5.161494755157037e-06, + "hu": 
1.5652040019631386e-05, + "ta": 2.540577042964287e-05, + "no": 6.423583727155346e-06, + "th": 0.00017361690697725862, + "ur": 2.3866510673542507e-05, + "hr": 3.603303866839269e-06, + "bg": 6.323995876300614e-06, + "lt": 2.4140632604030543e-07, + "la": 0.000605982553679496, + "mi": 9.43938794080168e-05, + "ml": 4.925132543576183e-06, + "cy": 0.0011864564148709178, + "sk": 6.562104317708872e-07, + "te": 6.627490620303433e-06, + "fa": 2.5011888283188455e-05, + "lv": 8.474158619264927e-08, + "bn": 2.8953361379535636e-06, + "sr": 7.596187145963995e-08, + "az": 6.497363358448638e-08, + "sl": 8.377933227166068e-06, + "kn": 2.687426103875623e-08, + "et": 7.596187145963995e-08, + "mk": 5.4287504269723286e-08, + "br": 0.0003294670023024082, + "eu": 1.1338299827912124e-06, + "is": 2.693082308269368e-07, + "hy": 1.5586363133479608e-07, + "ne": 1.0712341236285283e-07, + "mn": 4.876541765952425e-07, + "bs": 1.169821643998148e-06, + "kk": 5.915916645449215e-08, + "sq": 7.960735359802129e-08, + "sw": 9.346260412712581e-06, + "gl": 1.3180339010432363e-05, + "mr": 1.2523994996627152e-07, + "pa": 2.7785696943283256e-07, + "si": 7.628194452991011e-06, + "km": 0.00011565379827516153, + "sn": 8.073935896391049e-05, + "yo": 1.0105716683028731e-05, + "so": 8.132403195304505e-09, + "af": 6.36020956790162e-07, + "oc": 2.424235390208196e-05, + "ka": 9.433752445886512e-09, + "be": 6.524740911117988e-06, + "tg": 5.37519051491131e-09, + "sd": 3.2996334198287514e-07, + "gu": 2.5444039764010995e-08, + "am": 2.193413273232636e-08, + "yi": 6.261604426072154e-07, + "lo": 1.4110742085904349e-06, + "uz": 8.115323413271369e-10, + "fo": 2.0013287382880662e-07, + "ht": 3.547440201145946e-06, + "ps": 2.555125320213847e-06, + "tk": 4.633703643008857e-09, + "nn": 0.0005782325752079487, + "mt": 2.5643599244062898e-08, + "sa": 1.9479279217193834e-05, + "lb": 5.089128674029553e-09, + "my": 3.603303866839269e-06, + "bo": 1.7561102367835701e-06, + "tl": 2.7470186978462152e-05, + "mg": 1.2303933871748995e-08, + 
"as": 2.092969531020117e-08, + "tt": 1.5889033422311627e-09, + "haw": 0.00013521297660190612, + "ln": 5.272798944133683e-07, + "ha": 1.004217775602001e-08, + "ba": 5.949793546733417e-09, + "jw": 0.0002448391169309616, + "su": 6.848170475137749e-09 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/bonjour_vous_allez_bien.mp3.words.json b/tests/expected/medium_auto/bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..3685a9bb214825ee9e95617a328fb5cb9a0eb3e4 --- /dev/null +++ b/tests/expected/medium_auto/bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,235 @@ +{ + "text": " Bonjour ! Est-ce que vous allez bien ? Bonjour ! Est-ce que vous allez bien ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 3.46, + "text": " Bonjour ! Est-ce que vous allez bien ?", + "tokens": [ + 50364, + 25431, + 2298, + 4410, + 12, + 384, + 631, + 2630, + 18146, + 3610, + 2506, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.3616434610806979, + "compression_ratio": 0.8260869565217391, + "no_speech_prob": 0.07169149070978165, + "confidence": 0.936, + "words": [ + { + "text": "Bonjour !", + "start": 0.42, + "end": 1.92, + "confidence": 0.874 + }, + { + "text": "Est-ce", + "start": 1.92, + "end": 2.16, + "confidence": 0.885 + }, + { + "text": "que", + "start": 2.16, + "end": 2.24, + "confidence": 0.988 + }, + { + "text": "vous", + "start": 2.24, + "end": 2.38, + "confidence": 0.996 + }, + { + "text": "allez", + "start": 2.38, + "end": 2.58, + "confidence": 0.99 + }, + { + "text": "bien ?", + "start": 2.58, + "end": 3.46, + "confidence": 0.999 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 32.94, + "end": 35.86, + "text": " Bonjour ! 
Est-ce que vous allez bien ?", + "tokens": [ + 50364, + 25431, + 2298, + 4410, + 12, + 384, + 631, + 2630, + 18146, + 3610, + 2506, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.30651259422302246, + "compression_ratio": 0.8260869565217391, + "no_speech_prob": 0.40451279282569885, + "confidence": 0.933, + "words": [ + { + "text": "Bonjour !", + "start": 32.94, + "end": 34.44, + "confidence": 0.741 + }, + { + "text": "Est-ce", + "start": 34.44, + "end": 34.7, + "confidence": 0.921 + }, + { + "text": "que", + "start": 34.7, + "end": 34.76, + "confidence": 0.996 + }, + { + "text": "vous", + "start": 34.76, + "end": 34.9, + "confidence": 0.998 + }, + { + "text": "allez", + "start": 34.9, + "end": 35.1, + "confidence": 0.997 + }, + { + "text": "bien ?", + "start": 35.1, + "end": 35.86, + "confidence": 0.999 + } + ] + } + ], + "language": "fr", + "language_probs": { + "en": 0.06090574339032173, + "zh": 0.003715273691341281, + "de": 0.005754328332841396, + "es": 0.007161377463489771, + "ru": 0.0019886428490281105, + "ko": 0.0026760115288197994, + "fr": 0.7536683082580566, + "ja": 0.002848599338904023, + "pt": 0.0049219378270208836, + "tr": 0.0009844496380537748, + "pl": 0.0036009668838232756, + "ca": 2.1080166334286332e-05, + "nl": 0.002848599338904023, + "ar": 0.00263452366925776, + "sv": 0.00025680899852886796, + "it": 0.0036576741840690374, + "id": 0.00012321829854045063, + "hi": 0.00041684217285364866, + "fi": 8.468662417726591e-05, + "vi": 0.0002489078033249825, + "he": 4.325369809521362e-05, + "uk": 4.0003127651289105e-05, + "el": 7.591259782202542e-05, + "ms": 0.0007202387205325067, + "cs": 0.0002955853415187448, + "ro": 9.596251766197383e-05, + "da": 4.2583109461702406e-05, + "hu": 7.357701542787254e-05, + "ta": 7.634730536665302e-06, + "no": 5.383009556680918e-05, + "th": 0.00013745995238423347, + "ur": 7.243630534503609e-05, + "hr": 2.8528902475954965e-06, + "bg": 1.1824902685475536e-05, + "lt": 5.035650474383147e-07, + "la": 0.02311721071600914, + "mi": 
0.00021966038912069052, + "ml": 1.4948076568543911e-05, + "cy": 0.006319893989712, + "sk": 8.255112334154546e-06, + "te": 1.980298475245945e-05, + "fa": 0.00011575288226595148, + "lv": 8.700824309926247e-07, + "bn": 1.1641573109955061e-05, + "sr": 9.02842458572195e-08, + "az": 3.33536695507064e-06, + "sl": 1.7205131371156313e-05, + "kn": 3.46094878977965e-07, + "et": 1.6255279433607939e-06, + "mk": 6.452324186057012e-08, + "br": 0.013589906506240368, + "eu": 2.0114837752771564e-05, + "is": 4.929352144245058e-06, + "hy": 1.0660472753443173e-06, + "ne": 2.0548598058667267e-06, + "mn": 5.0568687584018335e-05, + "bs": 3.441242597546079e-06, + "kk": 4.957580586051336e-07, + "sq": 1.9719890076430602e-07, + "sw": 7.754960279271472e-06, + "gl": 7.02076795278117e-05, + "mr": 1.785293193279358e-06, + "pa": 4.558905857265927e-06, + "si": 6.0051803302485496e-05, + "km": 0.001573145855218172, + "sn": 0.0003915869747288525, + "yo": 0.00011575288226595148, + "so": 1.5969655464687094e-07, + "af": 8.001128662726842e-06, + "oc": 0.0006356084486469626, + "ka": 1.0150930052077456e-07, + "be": 1.0766695595521014e-05, + "tg": 1.0071934752886591e-07, + "sd": 1.220026479131775e-05, + "gu": 1.4093170364049001e-07, + "am": 8.56593089793023e-07, + "yi": 1.3824710549670272e-05, + "lo": 8.001128662726842e-06, + "uz": 4.0063390827072e-08, + "fo": 2.388695975241717e-05, + "ht": 0.0004040172789245844, + "ps": 3.2836567243066384e-06, + "tk": 1.9719890076430602e-07, + "nn": 0.07120601832866669, + "mt": 1.1708239071595017e-06, + "sa": 0.0002910027396865189, + "lb": 6.671153300885635e-07, + "my": 2.7926684197154827e-05, + "bo": 7.516364803450415e-06, + "tl": 7.243630534503609e-05, + "mg": 5.61767421913828e-07, + "as": 1.0660472753443173e-06, + "tt": 2.5071027920375855e-08, + "haw": 0.014466380700469017, + "ln": 2.9727802029810846e-05, + "ha": 3.40729144454599e-07, + "ba": 2.0666269051616837e-07, + "jw": 0.006833434104919434, + "su": 3.46094878977965e-07 + } +} \ No newline at end of file diff --git 
a/tests/expected/medium_auto/empty.mp3.words.json b/tests/expected/medium_auto/empty.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..894bb497261294d3fb3b7b5a7efa0b4c19e4c765 --- /dev/null +++ b/tests/expected/medium_auto/empty.mp3.words.json @@ -0,0 +1,147 @@ +{ + "text": " Thanks for watching!", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.0, + "end": 2.52, + "text": " Thanks for watching!", + "tokens": [ + 50364, + 2561, + 337, + 1976, + 0, + 50518 + ], + "temperature": 0.0, + "avg_logprob": -0.8084396634783063, + "compression_ratio": 0.7142857142857143, + "no_speech_prob": 0.43768733739852905, + "confidence": 0.369, + "words": [ + { + "text": "Thanks", + "start": 0.0, + "end": 1.5, + "confidence": 0.056 + }, + { + "text": "for", + "start": 1.5, + "end": 2.46, + "confidence": 0.948 + }, + { + "text": "watching!", + "start": 2.46, + "end": 2.52, + "confidence": 0.948 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.47364965081214905, + "zh": 0.014989392831921577, + "de": 0.0077763949520885944, + "es": 0.009985089302062988, + "ru": 0.07263652980327606, + "ko": 0.0810319036245346, + "fr": 0.008023244328796864, + "ja": 0.028444871306419373, + "pt": 0.011857587844133377, + "tr": 0.008675196208059788, + "pl": 0.005020818207412958, + "ca": 8.504862489644438e-05, + "nl": 0.0031914261635392904, + "ar": 0.005778925959020853, + "sv": 0.0022986982949078083, + "it": 0.0030932363588362932, + "id": 0.0014841509982943535, + "hi": 0.00324168405495584, + "fi": 0.0010042268550023437, + "vi": 0.0018761425744742155, + "he": 0.0002348267735214904, + "uk": 0.0007462779758498073, + "el": 0.0014161868020892143, + "ms": 0.0035050958395004272, + "cs": 0.000914358941372484, + "ro": 0.0007121034432202578, + "da": 0.0001516155753051862, + "hu": 0.0007820926839485765, + "ta": 0.0012694615870714188, + "no": 0.00027454033261165023, + "th": 0.0022279745899140835, + "ur": 0.0007462779758498073, + "hr": 6.833848601672798e-05, + 
"bg": 0.00011624769831541926, + "lt": 1.3456648048304487e-05, + "la": 0.010796455666422844, + "mi": 0.00033115886617451906, + "ml": 0.0007347080390900373, + "cy": 0.004942977800965309, + "sk": 6.941466563148424e-05, + "te": 0.000399453827412799, + "fa": 0.00016393551777582616, + "lv": 4.6504928832291625e-06, + "bn": 0.0001109243166865781, + "sr": 1.0057395911644562e-06, + "az": 9.596834615877015e-07, + "sl": 6.222290539881214e-05, + "kn": 1.6324765965691768e-06, + "et": 5.028381565352902e-06, + "mk": 1.6939416980221722e-07, + "br": 0.0001916600449476391, + "eu": 3.621807309173164e-06, + "is": 2.0842062440351583e-05, + "hy": 3.916107743862085e-06, + "ne": 8.161869118339382e-06, + "mn": 6.03085063630715e-05, + "bs": 8.161869118339382e-06, + "kk": 1.1758287428165204e-06, + "sq": 1.332388478658686e-06, + "sw": 5.0784856284735724e-05, + "gl": 5.406019772635773e-05, + "mr": 1.5097939467523247e-06, + "pa": 2.096141315632849e-06, + "si": 0.0002205993514508009, + "km": 0.0006383254658430815, + "sn": 0.00035251679946668446, + "yo": 3.657895649666898e-05, + "so": 7.75543043118887e-08, + "af": 1.1155952961416915e-05, + "oc": 7.910754902695771e-06, + "ka": 3.421856717977789e-07, + "be": 5.43697706234525e-06, + "tg": 4.3165474750139765e-08, + "sd": 2.1626799480145564e-06, + "gu": 1.4489052091448684e-07, + "am": 4.533224000624614e-07, + "yi": 2.338414788027876e-06, + "lo": 1.0000130714615807e-05, + "uz": 9.556565316870547e-09, + "fo": 7.66736593504902e-06, + "ht": 9.845093700278085e-06, + "ps": 4.79811478726333e-06, + "tk": 8.191367584231557e-08, + "nn": 0.21349063515663147, + "mt": 4.1925463278857933e-07, + "sa": 6.833848601672798e-05, + "lb": 4.0550212077050674e-08, + "my": 7.202823780971812e-06, + "bo": 8.290399819088634e-06, + "tl": 0.0013097586343064904, + "mg": 1.6418248094396404e-07, + "as": 3.36880560780628e-07, + "tt": 1.651226533283534e-08, + "haw": 0.0035050958395004272, + "ln": 3.0673325568386645e-07, + "ha": 1.2490343692661554e-07, + "ba": 7.877560648239523e-08, + 
"jw": 0.004942977800965309, + "su": 3.36880560780628e-07 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/gaenswein15.mp3.words.json b/tests/expected/medium_auto/gaenswein15.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..e23e145f910be90eba7dd5a5f8e8a2fa74e40841 --- /dev/null +++ b/tests/expected/medium_auto/gaenswein15.mp3.words.json @@ -0,0 +1,417 @@ +{ + "text": " Die Wiederzulassung des Messbuchs von 1962 als Missale für die außerordentliche Form des römischen Rethus ist dann nicht so weitergegangen, wie sich Papst Benediktas gewünscht hatte. Das hat er als Emeritor so gemacht.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.84, + "end": 8.56, + "text": " Die Wiederzulassung des Messbuchs von 1962 als Missale für die außerordentliche Form des römischen Rethus", + "tokens": [ + 50364, + 3229, + 45742, + 89, + 425, + 40828, + 730, + 9847, + 65, + 37503, + 2957, + 39498, + 3907, + 5275, + 1220, + 2959, + 978, + 39428, + 765, + 7698, + 68, + 10126, + 730, + 367, + 32374, + 6282, + 497, + 3293, + 301, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.28166988079364486, + "compression_ratio": 1.247191011235955, + "no_speech_prob": 0.2541781961917877, + "confidence": 0.869, + "words": [ + { + "text": "Die", + "start": 0.84, + "end": 1.12, + "confidence": 0.872 + }, + { + "text": "Wiederzulassung", + "start": 1.12, + "end": 1.92, + "confidence": 0.976 + }, + { + "text": "des", + "start": 1.92, + "end": 2.16, + "confidence": 0.986 + }, + { + "text": "Messbuchs", + "start": 2.16, + "end": 2.74, + "confidence": 0.947 + }, + { + "text": "von", + "start": 2.74, + "end": 3.28, + "confidence": 0.971 + }, + { + "text": "1962", + "start": 3.28, + "end": 4.9, + "confidence": 0.981 + }, + { + "text": "als", + "start": 4.9, + "end": 5.26, + "confidence": 0.925 + }, + { + "text": "Missale", + "start": 5.26, + "end": 5.76, + "confidence": 0.905 + }, + { + "text": "für", + "start": 5.76, + "end": 5.96, + 
"confidence": 0.955 + }, + { + "text": "die", + "start": 5.96, + "end": 6.12, + "confidence": 0.99 + }, + { + "text": "außerordentliche", + "start": 6.12, + "end": 7.06, + "confidence": 0.943 + }, + { + "text": "Form", + "start": 7.06, + "end": 7.32, + "confidence": 0.834 + }, + { + "text": "des", + "start": 7.32, + "end": 7.64, + "confidence": 0.863 + }, + { + "text": "römischen", + "start": 7.64, + "end": 8.04, + "confidence": 0.676 + }, + { + "text": "Rethus", + "start": 8.04, + "end": 8.56, + "confidence": 0.629 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 9.44, + "end": 12.74, + "text": " ist dann nicht so weitergegangen, wie sich Papst Benediktas gewünscht hatte.", + "tokens": [ + 50814, + 1418, + 3594, + 1979, + 370, + 8988, + 432, + 47152, + 11, + 3355, + 3041, + 15919, + 372, + 39753, + 9874, + 296, + 6906, + 3412, + 82, + 4701, + 13299, + 13, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.28166988079364486, + "compression_ratio": 1.247191011235955, + "no_speech_prob": 0.2541781961917877, + "confidence": 0.889, + "words": [ + { + "text": "ist", + "start": 9.44, + "end": 9.66, + "confidence": 0.975 + }, + { + "text": "dann", + "start": 9.66, + "end": 9.82, + "confidence": 0.688 + }, + { + "text": "nicht", + "start": 9.82, + "end": 10.0, + "confidence": 0.996 + }, + { + "text": "so", + "start": 10.0, + "end": 10.16, + "confidence": 0.992 + }, + { + "text": "weitergegangen,", + "start": 10.16, + "end": 10.84, + "confidence": 0.811 + }, + { + "text": "wie", + "start": 10.9, + "end": 11.06, + "confidence": 0.988 + }, + { + "text": "sich", + "start": 11.06, + "end": 11.26, + "confidence": 0.964 + }, + { + "text": "Papst", + "start": 11.26, + "end": 11.56, + "confidence": 0.884 + }, + { + "text": "Benediktas", + "start": 11.56, + "end": 12.08, + "confidence": 0.764 + }, + { + "text": "gewünscht", + "start": 12.08, + "end": 12.56, + "confidence": 0.992 + }, + { + "text": "hatte.", + "start": 12.56, + "end": 12.74, + "confidence": 0.952 + } + ] + }, 
+ { + "id": 2, + "seek": 0, + "start": 14.0, + "end": 15.48, + "text": " Das hat er als Emeritor so gemacht.", + "tokens": [ + 51014, + 2846, + 2385, + 1189, + 3907, + 18477, + 3029, + 370, + 12293, + 13, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.28166988079364486, + "compression_ratio": 1.247191011235955, + "no_speech_prob": 0.2541781961917877, + "confidence": 0.442, + "words": [ + { + "text": "Das", + "start": 14.0, + "end": 14.2, + "confidence": 0.968 + }, + { + "text": "hat", + "start": 14.2, + "end": 14.36, + "confidence": 0.845 + }, + { + "text": "er", + "start": 14.36, + "end": 14.5, + "confidence": 0.99 + }, + { + "text": "als", + "start": 14.5, + "end": 14.7, + "confidence": 0.977 + }, + { + "text": "Emeritor", + "start": 14.7, + "end": 15.24, + "confidence": 0.429 + }, + { + "text": "so", + "start": 15.24, + "end": 15.42, + "confidence": 0.111 + }, + { + "text": "gemacht.", + "start": 15.42, + "end": 15.48, + "confidence": 0.09 + } + ] + } + ], + "language": "de", + "language_probs": { + "en": 0.006050508003681898, + "zh": 0.00035218181437812746, + "de": 0.9862326383590698, + "es": 0.0004315021797083318, + "ru": 0.0005806496483273804, + "ko": 0.0005627849022857845, + "fr": 0.0008188472711481154, + "ja": 0.0003577278694137931, + "pt": 0.0006683236570097506, + "tr": 0.0003577278694137931, + "pl": 0.0007455689483322203, + "ca": 1.2701659670710796e-06, + "nl": 0.0009877183474600315, + "ar": 0.00017434264009352773, + "sv": 5.3171497711446136e-05, + "it": 0.0005897935479879379, + "id": 1.8958882719743997e-05, + "hi": 5.2347153541632e-05, + "fi": 1.1145352800667752e-05, + "vi": 6.120002217357978e-05, + "he": 6.655193374172086e-06, + "uk": 7.903237928985618e-06, + "el": 4.013595389551483e-05, + "ms": 1.7810220015235245e-05, + "cs": 9.990628313971683e-06, + "ro": 1.673115730227437e-05, + "da": 4.945720320392866e-06, + "hu": 4.477489346754737e-05, + "ta": 1.7634508822084172e-06, + "no": 2.9532243388530333e-06, + "th": 4.076800178154372e-05, + "ur": 
2.6321804398321547e-05, + "hr": 2.3131441651003115e-07, + "bg": 2.424154104119225e-07, + "lt": 1.8586635519568517e-07, + "la": 0.00021697291231248528, + "mi": 3.5070404464931926e-06, + "ml": 3.618366235969006e-06, + "cy": 4.013595389551483e-05, + "sk": 3.582667602586298e-07, + "te": 3.934790697712742e-07, + "fa": 3.0949524898460368e-06, + "lv": 4.3462691223794536e-08, + "bn": 5.131934699420526e-07, + "sr": 5.482659659605815e-09, + "az": 2.2903229535131686e-08, + "sl": 1.0206069873675006e-06, + "kn": 8.761265490875303e-09, + "et": 6.891269066500172e-08, + "mk": 1.5344205905876152e-09, + "br": 2.817986569425557e-06, + "eu": 2.207217590921573e-07, + "is": 1.3812415033953584e-07, + "hy": 1.4250868218823598e-07, + "ne": 1.2576346364312485e-07, + "mn": 3.1616932005817944e-07, + "bs": 4.7734424413192755e-08, + "kk": 7.320311024017201e-09, + "sq": 1.18820384642504e-08, + "sw": 2.621135593017243e-07, + "gl": 2.0941495222359663e-06, + "mr": 2.053031877835565e-08, + "pa": 3.776103696395694e-08, + "si": 6.487373411800945e-07, + "km": 2.396627314737998e-05, + "sn": 3.618366235969006e-06, + "yo": 2.2772820784666692e-07, + "so": 3.266969750281845e-10, + "af": 1.0264515282187858e-07, + "oc": 4.600236138685432e-07, + "ka": 1.333127719327365e-09, + "be": 2.7469266683510796e-07, + "tg": 2.060452086727338e-10, + "sd": 1.8547597235851754e-08, + "gu": 1.046383979463883e-09, + "am": 1.924594483782016e-09, + "yi": 2.704339294723468e-07, + "lo": 4.449337609457871e-08, + "uz": 1.6299518679208091e-10, + "fo": 7.870076501603762e-08, + "ht": 1.338745079237924e-07, + "ps": 6.945317920781235e-08, + "tk": 9.453291482941495e-10, + "nn": 0.00032066518906503916, + "mt": 1.4191070540903183e-09, + "sa": 3.2945599741651677e-06, + "lb": 7.837053783710246e-10, + "my": 1.2381367753278028e-07, + "bo": 6.784429729123076e-08, + "tl": 2.999730895680841e-06, + "mg": 1.046383979463883e-09, + "as": 1.685231287851252e-09, + "tt": 3.110817506368768e-11, + "haw": 7.195980288088322e-06, + "ln": 
3.738849230217056e-09, + "ha": 3.8194747364883597e-10, + "ba": 9.306730386349216e-10, + "jw": 2.9826507670804858e-05, + "su": 2.2105424435370225e-10 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/gloria.mp3.words.json b/tests/expected/medium_auto/gloria.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..666a4b26ecb2754eb9f31b9eaab69a53d7f7150a --- /dev/null +++ b/tests/expected/medium_auto/gloria.mp3.words.json @@ -0,0 +1,639 @@ +{ + "text": " Hello. How are you? Love. How are you? I'm okay. I will be. I said she could stay with us tomorrow, she feels better. Of course she can. This won't be for long. Well, you can stay as long as you want, my love. I really miss you.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 1.4, + "end": 1.74, + "text": " Hello.", + "tokens": [ + 50364, + 2425, + 13, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.285, + "words": [ + { + "text": "Hello.", + "start": 1.4, + "end": 1.74, + "confidence": 0.285 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 2.32, + "end": 3.5, + "text": " How are you?", + "tokens": [ + 50464, + 1012, + 366, + 291, + 30, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.786, + "words": [ + { + "text": "How", + "start": 2.32, + "end": 2.82, + "confidence": 0.551 + }, + { + "text": "are", + "start": 2.82, + "end": 3.24, + "confidence": 0.989 + }, + { + "text": "you?", + "start": 3.24, + "end": 3.5, + "confidence": 0.893 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 3.5, + "end": 4.26, + "text": " Love.", + "tokens": [ + 50564, + 5956, + 13, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 
0.05016394704580307, + "confidence": 0.244, + "words": [ + { + "text": "Love.", + "start": 3.5, + "end": 4.26, + "confidence": 0.244 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 5.5, + "end": 6.38, + "text": " How are you?", + "tokens": [ + 50664, + 1012, + 366, + 291, + 30, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.926, + "words": [ + { + "text": "How", + "start": 5.5, + "end": 5.68, + "confidence": 0.851 + }, + { + "text": "are", + "start": 5.68, + "end": 6.08, + "confidence": 0.998 + }, + { + "text": "you?", + "start": 6.08, + "end": 6.38, + "confidence": 0.935 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 7.5, + "end": 9.18, + "text": " I'm okay. I will be.", + "tokens": [ + 50764, + 286, + 478, + 1392, + 13, + 286, + 486, + 312, + 13, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.77, + "words": [ + { + "text": "I'm", + "start": 7.5, + "end": 7.52, + "confidence": 0.767 + }, + { + "text": "okay.", + "start": 7.52, + "end": 8.22, + "confidence": 0.488 + }, + { + "text": "I", + "start": 8.42, + "end": 8.64, + "confidence": 0.767 + }, + { + "text": "will", + "start": 8.64, + "end": 8.94, + "confidence": 0.949 + }, + { + "text": "be.", + "start": 8.94, + "end": 9.18, + "confidence": 0.997 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 9.5, + "end": 11.52, + "text": " I said she could stay with us tomorrow, she feels better.", + "tokens": [ + 50864, + 286, + 848, + 750, + 727, + 1754, + 365, + 505, + 4153, + 11, + 750, + 3417, + 1101, + 13, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.786, + "words": [ + { + "text": "I", + "start": 9.5, + "end": 9.52, + 
"confidence": 0.883 + }, + { + "text": "said", + "start": 9.52, + "end": 9.64, + "confidence": 0.856 + }, + { + "text": "she", + "start": 9.64, + "end": 9.78, + "confidence": 0.928 + }, + { + "text": "could", + "start": 9.78, + "end": 9.96, + "confidence": 0.909 + }, + { + "text": "stay", + "start": 9.96, + "end": 10.16, + "confidence": 0.994 + }, + { + "text": "with", + "start": 10.16, + "end": 10.28, + "confidence": 0.977 + }, + { + "text": "us", + "start": 10.28, + "end": 10.46, + "confidence": 0.993 + }, + { + "text": "tomorrow,", + "start": 10.46, + "end": 10.66, + "confidence": 0.514 + }, + { + "text": "she", + "start": 10.72, + "end": 10.86, + "confidence": 0.279 + }, + { + "text": "feels", + "start": 10.86, + "end": 11.16, + "confidence": 0.809 + }, + { + "text": "better.", + "start": 11.16, + "end": 11.52, + "confidence": 0.992 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 12.06, + "end": 13.36, + "text": " Of course she can.", + "tokens": [ + 50964, + 2720, + 1164, + 750, + 393, + 13, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.928, + "words": [ + { + "text": "Of", + "start": 12.06, + "end": 12.34, + "confidence": 0.788 + }, + { + "text": "course", + "start": 12.34, + "end": 12.56, + "confidence": 0.989 + }, + { + "text": "she", + "start": 12.56, + "end": 12.88, + "confidence": 0.958 + }, + { + "text": "can.", + "start": 12.88, + "end": 13.36, + "confidence": 0.993 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 13.5, + "end": 15.26, + "text": " This won't be for long.", + "tokens": [ + 51064, + 639, + 1582, + 380, + 312, + 337, + 938, + 13, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.892, + "words": [ + { + "text": "This", + "start": 13.5, + "end": 14.28, + "confidence": 0.543 + }, + { 
+ "text": "won't", + "start": 14.28, + "end": 14.6, + "confidence": 0.975 + }, + { + "text": "be", + "start": 14.6, + "end": 14.8, + "confidence": 0.996 + }, + { + "text": "for", + "start": 14.8, + "end": 14.96, + "confidence": 0.984 + }, + { + "text": "long.", + "start": 14.96, + "end": 15.26, + "confidence": 0.996 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 15.5, + "end": 17.62, + "text": " Well, you can stay as long as you want, my love.", + "tokens": [ + 51164, + 1042, + 11, + 291, + 393, + 1754, + 382, + 938, + 382, + 291, + 528, + 11, + 452, + 959, + 13, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.927, + "words": [ + { + "text": "Well,", + "start": 15.5, + "end": 15.56, + "confidence": 0.675 + }, + { + "text": "you", + "start": 15.68, + "end": 15.7, + "confidence": 0.744 + }, + { + "text": "can", + "start": 15.7, + "end": 15.94, + "confidence": 0.982 + }, + { + "text": "stay", + "start": 15.94, + "end": 16.14, + "confidence": 0.985 + }, + { + "text": "as", + "start": 16.14, + "end": 16.28, + "confidence": 0.972 + }, + { + "text": "long", + "start": 16.28, + "end": 16.4, + "confidence": 0.994 + }, + { + "text": "as", + "start": 16.4, + "end": 16.48, + "confidence": 0.996 + }, + { + "text": "you", + "start": 16.48, + "end": 16.62, + "confidence": 0.995 + }, + { + "text": "want,", + "start": 16.62, + "end": 16.8, + "confidence": 0.995 + }, + { + "text": "my", + "start": 16.88, + "end": 17.22, + "confidence": 0.95 + }, + { + "text": "love.", + "start": 17.22, + "end": 17.62, + "confidence": 0.993 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 17.76, + "end": 19.26, + "text": " I really miss you.", + "tokens": [ + 51264, + 286, + 534, + 1713, + 291, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.23879062428193934, + "compression_ratio": 1.4615384615384615, + "no_speech_prob": 0.05016394704580307, + 
"confidence": 0.792, + "words": [ + { + "text": "I", + "start": 17.76, + "end": 17.98, + "confidence": 0.587 + }, + { + "text": "really", + "start": 17.98, + "end": 18.36, + "confidence": 0.944 + }, + { + "text": "miss", + "start": 18.36, + "end": 18.78, + "confidence": 0.905 + }, + { + "text": "you.", + "start": 18.78, + "end": 19.26, + "confidence": 0.787 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.7642066478729248, + "zh": 0.002470605308189988, + "de": 0.00040966656524688005, + "es": 0.0006444960017688572, + "ru": 0.0002904970897361636, + "ko": 0.0003848461201414466, + "fr": 0.0005512665957212448, + "ja": 0.00021587910305242985, + "pt": 0.0011135890381410718, + "tr": 0.0011135890381410718, + "pl": 0.0003396255197003484, + "ca": 8.587077900301665e-05, + "nl": 0.0008538184338249266, + "ar": 0.0006860623834654689, + "sv": 0.00031410224619321525, + "it": 0.00036152946995571256, + "id": 1.690895987849217e-05, + "hi": 3.751416443265043e-05, + "fi": 2.0396098989294842e-05, + "vi": 0.00011555175296962261, + "he": 7.386976903944742e-06, + "uk": 2.3475764464819804e-05, + "el": 0.00016552023589611053, + "ms": 0.00035592447966337204, + "cs": 1.0917243344010785e-05, + "ro": 6.029074484104058e-06, + "da": 3.993362042820081e-05, + "hu": 1.6134639736264944e-05, + "ta": 6.518983809655765e-06, + "no": 2.7020438210456632e-05, + "th": 9.730433521326631e-05, + "ur": 4.317853745305911e-05, + "hr": 7.314098411370651e-07, + "bg": 1.324411982750462e-06, + "lt": 3.9149543340499804e-07, + "la": 0.0018942790338769555, + "mi": 0.00033436008379794657, + "ml": 1.02558014987153e-05, + "cy": 0.21894888579845428, + "sk": 1.3742783266934566e-07, + "te": 3.772898935494595e-06, + "fa": 2.3475764464819804e-05, + "lv": 3.195292492819135e-07, + "bn": 2.1835862753505353e-06, + "sr": 2.107523933148059e-08, + "az": 2.7330784746482095e-07, + "sl": 1.4690757780044805e-05, + "kn": 2.7061142660045334e-08, + "et": 1.1939934552174236e-07, + "mk": 1.615894618112179e-08, + "br": 
1.7720436517265625e-05, + "eu": 1.0476960596861318e-06, + "is": 1.690895987849217e-05, + "hy": 4.8241702188533964e-08, + "ne": 3.096983789419028e-07, + "mn": 1.244169880010304e-06, + "bs": 2.5528709102218272e-06, + "kk": 3.114718438723685e-08, + "sq": 5.520970489669708e-07, + "sw": 3.2779512366687413e-06, + "gl": 2.2753489247406833e-05, + "mr": 7.019126258001052e-08, + "pa": 4.299735962831619e-07, + "si": 1.324411982750462e-06, + "km": 7.008568354649469e-05, + "sn": 9.78615389612969e-06, + "yo": 8.772251931077335e-06, + "so": 4.851795409877013e-09, + "af": 9.050712833413854e-06, + "oc": 2.474327402524068e-06, + "ka": 3.6055483043639924e-09, + "be": 1.115266741180676e-06, + "tg": 6.181347877998178e-09, + "sd": 6.003777031082791e-08, + "gu": 4.8898485260906455e-09, + "am": 2.278776634057067e-08, + "yi": 7.200703180387791e-07, + "lo": 5.186471412343963e-07, + "uz": 6.935280127962073e-10, + "fo": 1.5727781601526658e-06, + "ht": 2.7603114176599775e-06, + "ps": 1.597545633558184e-06, + "tk": 4.417610277585027e-09, + "nn": 0.0033245631493628025, + "mt": 3.4013709182545426e-07, + "sa": 3.544309947756119e-06, + "lb": 8.188955291643651e-09, + "my": 1.6227033938776003e-06, + "bo": 2.2529004581883783e-06, + "tl": 5.9018060710513964e-05, + "mg": 1.6934430746573526e-08, + "as": 3.6414750326230205e-08, + "tt": 4.248373652870896e-09, + "haw": 8.999180136015639e-05, + "ln": 5.216171672373093e-08, + "ha": 2.0748498030798146e-08, + "ba": 6.038157085441753e-09, + "jw": 7.460582128260285e-05, + "su": 2.351112904364072e-08 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/laugh1.mp3.words.json b/tests/expected/medium_auto/laugh1.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..e30d1c3b3056b4e837f39521078bdd7051707de7 --- /dev/null +++ b/tests/expected/medium_auto/laugh1.mp3.words.json @@ -0,0 +1,133 @@ +{ + "text": " hahahaha", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.32, + "end": 1.58, + "text": " hahahaha", + 
"tokens": [ + 50364, + 17206, + 15380, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -1.2670220375061034, + "compression_ratio": 0.6666666666666666, + "no_speech_prob": 0.5899588465690613, + "confidence": 0.135, + "words": [ + { + "text": "hahahaha", + "start": 0.32, + "end": 1.58, + "confidence": 0.135 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.45703765749931335, + "zh": 0.024991001933813095, + "de": 0.04668933525681496, + "es": 0.07231386005878448, + "ru": 0.03362906724214554, + "ko": 0.012179641053080559, + "fr": 0.03751593455672264, + "ja": 0.01074849534779787, + "pt": 0.059950292110443115, + "tr": 0.016135403886437416, + "pl": 0.02240178734064102, + "ca": 0.0015244607347995043, + "nl": 0.008636659011244774, + "ar": 0.03014490194618702, + "sv": 0.016647595912218094, + "it": 0.011441714130342007, + "id": 0.0012837247923016548, + "hi": 0.009786616079509258, + "fi": 0.0038324943743646145, + "vi": 0.004695670213550329, + "he": 0.0012249386636540294, + "uk": 0.0059358831495046616, + "el": 0.0043427846394479275, + "ms": 0.006318714469671249, + "cs": 0.009940733201801777, + "ro": 0.01108968909829855, + "da": 0.0026755118742585182, + "hu": 0.0022180776577442884, + "ta": 0.00039767936686985195, + "no": 0.0018972221296280622, + "th": 0.0018678084015846252, + "ur": 0.006418219767510891, + "hr": 0.0008551450446248055, + "bg": 0.0015244607347995043, + "lt": 0.00019381343736313283, + "la": 0.006418219767510891, + "mi": 0.002717645140364766, + "ml": 0.0003620911738835275, + "cy": 0.011441714130342007, + "sk": 0.0009539831662550569, + "te": 0.001754643744789064, + "fa": 0.0038324943743646145, + "lv": 0.0001683880400378257, + "bn": 0.0016227801097556949, + "sr": 6.491936801467091e-05, + "az": 2.314771518285852e-05, + "sl": 0.0014320984482765198, + "kn": 2.664285602804739e-05, + "et": 0.00013320590369403362, + "mk": 4.7496025217697024e-05, + "br": 0.0002819968794938177, + "eu": 0.0001908086269395426, + "is": 0.0002776249311864376, + "hy": 
0.0001849380787461996, + "ne": 0.00011940499098272994, + "mn": 0.00012128534581279382, + "bs": 0.00033487958717159927, + "kk": 5.216418139752932e-05, + "sq": 0.00022659085516352206, + "sw": 0.002183689270168543, + "gl": 0.0008033344056457281, + "mr": 4.977541175321676e-05, + "pa": 0.00011043157428503036, + "si": 0.0010642451234161854, + "km": 0.001047745579853654, + "sn": 0.0018972221296280622, + "yo": 0.0003049113438464701, + "so": 1.163940214610193e-05, + "af": 9.899021097226068e-05, + "oc": 9.013162343762815e-05, + "ka": 3.114865467068739e-05, + "be": 0.00017646915512159467, + "tg": 5.412824521044968e-06, + "sd": 6.194649904500693e-05, + "gu": 1.3396869690041058e-05, + "am": 1.9190129023627378e-05, + "yi": 7.589843880850822e-05, + "lo": 0.0001533190516056493, + "uz": 3.150641703086876e-07, + "fo": 5.729114491259679e-05, + "ht": 9.013162343762815e-05, + "ps": 0.00047969285515137017, + "tk": 2.2564011032955023e-06, + "nn": 0.012965160422027111, + "mt": 1.6672673154971562e-05, + "sa": 0.00034550981945358217, + "lb": 1.2856585271947552e-06, + "my": 0.0001533190516056493, + "bo": 0.0001657774264458567, + "tl": 0.002116504358127713, + "mg": 5.584645805356558e-06, + "as": 1.831134795793332e-05, + "tt": 1.5267572734956047e-06, + "haw": 0.0009539831662550569, + "ln": 1.0934206329693552e-05, + "ha": 5.49806418348453e-06, + "ba": 2.2919341517990688e-06, + "jw": 0.003127990523353219, + "su": 4.8520246309635695e-06 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/laugh2.mp3.words.json b/tests/expected/medium_auto/laugh2.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..cc5244c74d4ffa3d0eec81aaee4bf9803b9da83e --- /dev/null +++ b/tests/expected/medium_auto/laugh2.mp3.words.json @@ -0,0 +1,133 @@ +{ + "text": " Hehehe", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.22, + "end": 0.64, + "text": " Hehehe", + "tokens": [ + 50364, + 634, + 23500, + 50464 + ], + "temperature": 0.0, + "avg_logprob": 
-1.0079832077026367, + "compression_ratio": 0.5, + "no_speech_prob": 0.3699853718280792, + "confidence": 0.334, + "words": [ + { + "text": "Hehehe", + "start": 0.22, + "end": 0.64, + "confidence": 0.334 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.6829636693000793, + "zh": 0.020623717457056046, + "de": 0.017097661271691322, + "es": 0.016832586377859116, + "ru": 0.02336973138153553, + "ko": 0.09388463199138641, + "fr": 0.014624404720962048, + "ja": 0.041015155613422394, + "pt": 0.01657162234187126, + "tr": 0.002581360749900341, + "pl": 0.0035283018369227648, + "ca": 0.00028962065698578954, + "nl": 0.0075870417058467865, + "ar": 0.003366729011759162, + "sv": 0.0032631459180265665, + "it": 0.0035838645417243242, + "id": 0.004898561630398035, + "hi": 0.004061050247400999, + "fi": 0.003065441967919469, + "vi": 0.002663301769644022, + "he": 0.0002516267995815724, + "uk": 0.0007872705464251339, + "el": 0.0005410826415754855, + "ms": 0.0037558579351752996, + "cs": 0.0009952031541615725, + "ro": 0.0006733882473781705, + "da": 0.00031808606581762433, + "hu": 0.0006131269037723541, + "ta": 0.00101087533403188, + "no": 0.0004020984342787415, + "th": 0.005214491859078407, + "ur": 0.0004020984342787415, + "hr": 0.00012073184188921005, + "bg": 8.8329310528934e-05, + "lt": 2.2684840587317012e-05, + "la": 0.0005163046298548579, + "mi": 0.0007872705464251339, + "ml": 0.0007057047332637012, + "cy": 0.001640812843106687, + "sk": 6.362121348502114e-05, + "te": 0.00036043874570168555, + "fa": 5.441810571937822e-05, + "lv": 1.4646435374743305e-05, + "bn": 5.7927773013943806e-05, + "sr": 1.9514486666594166e-06, + "az": 7.178978194133379e-07, + "sl": 0.00010654547804733738, + "kn": 2.1432470020954497e-06, + "et": 1.7123416910180822e-05, + "mk": 7.641982051609375e-07, + "br": 0.00010654547804733738, + "eu": 1.272504323424073e-05, + "is": 3.24945394822862e-05, + "hy": 8.345286914845929e-06, + "ne": 2.0334560758783482e-05, + "mn": 2.304207555425819e-05, + "bs": 
1.088430690288078e-05, + "kk": 3.5336167911736993e-06, + "sq": 2.390964937148965e-06, + "sw": 0.0001265258906641975, + "gl": 8.8329310528934e-05, + "mr": 5.825949301652145e-06, + "pa": 2.751983856796869e-06, + "si": 0.0001456304162275046, + "km": 0.0007750650402158499, + "sn": 0.00042139552533626556, + "yo": 2.304207555425819e-05, + "so": 1.9935302475460048e-07, + "af": 1.1229812116653193e-05, + "oc": 9.309840606874786e-06, + "ka": 5.011734742765839e-07, + "be": 1.5111363609321415e-05, + "tg": 5.7563557476214555e-08, + "sd": 2.795321279336349e-06, + "gu": 5.951582124907873e-07, + "am": 1.1119018381577916e-06, + "yi": 4.262356014805846e-06, + "lo": 2.3773511202307418e-05, + "uz": 1.9585014499057252e-08, + "fo": 3.820750862360001e-06, + "ht": 7.138101864256896e-06, + "ps": 9.023407073982526e-06, + "tk": 1.7051567624548625e-07, + "nn": 0.007706519681960344, + "mt": 4.563236188914743e-07, + "sa": 3.798996112891473e-05, + "lb": 8.64131379785249e-08, + "my": 2.5306770112365484e-05, + "bo": 1.4419363651541062e-05, + "tl": 0.002663301769644022, + "mg": 4.286763726213394e-07, + "as": 7.406862891912169e-07, + "tt": 4.698200939401431e-08, + "haw": 0.0005326939281076193, + "ln": 4.6350965021701995e-07, + "ha": 3.087639868226688e-07, + "ba": 2.0249235888059047e-07, + "jw": 0.0017195570981130004, + "su": 6.045305553925573e-07 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/punctuations.mp3.words.json b/tests/expected/medium_auto/punctuations.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..cf3491850620837ca929b3d250fdddf36252879e --- /dev/null +++ b/tests/expected/medium_auto/punctuations.mp3.words.json @@ -0,0 +1,169 @@ +{ + "text": " Dis-moi, est-ce que l'avion vole ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.38, + "end": 2.76, + "text": " Dis-moi, est-ce que l'avion vole ?", + "tokens": [ + 50364, + 4208, + 12, + 29292, + 11, + 871, + 12, + 384, + 631, + 287, + 6, + 706, + 313, + 49877, + 2506, + 
50496 + ], + "temperature": 0.0, + "avg_logprob": -0.26327380012063417, + "compression_ratio": 0.8095238095238095, + "no_speech_prob": 0.03882359713315964, + "confidence": 0.928, + "words": [ + { + "text": "Dis-moi,", + "start": 0.38, + "end": 1.1, + "confidence": 0.809 + }, + { + "text": "est-ce", + "start": 1.28, + "end": 1.5, + "confidence": 0.968 + }, + { + "text": "que", + "start": 1.5, + "end": 1.66, + "confidence": 0.978 + }, + { + "text": "l'avion", + "start": 1.66, + "end": 2.04, + "confidence": 0.993 + }, + { + "text": "vole ?", + "start": 2.04, + "end": 2.76, + "confidence": 0.898 + } + ] + } + ], + "language": "fr", + "language_probs": { + "en": 0.003270540852099657, + "zh": 0.00047116613131947815, + "de": 0.001078509958460927, + "es": 0.0011845114640891552, + "ru": 0.00093702576123178, + "ko": 0.0007529213326051831, + "fr": 0.9805174469947815, + "ja": 0.001148067880421877, + "pt": 0.0008141020080074668, + "tr": 0.00018451130017638206, + "pl": 0.000586375710554421, + "ca": 1.4227982319425792e-05, + "nl": 0.001078509958460927, + "ar": 0.00047116613131947815, + "sv": 9.133971616392955e-05, + "it": 0.0027540717273950577, + "id": 5.540033816942014e-05, + "hi": 4.88906262035016e-05, + "fi": 4.966054257238284e-05, + "vi": 5.8059056755155325e-05, + "he": 0.00010513137385714799, + "uk": 1.743249231367372e-05, + "el": 0.00029027703567408025, + "ms": 0.00015296523633878678, + "cs": 7.691574865020812e-05, + "ro": 0.00010846859368029982, + "da": 4.14057922171196e-06, + "hu": 7.0032590883784e-05, + "ta": 3.7700406210205983e-06, + "no": 5.234182481217431e-06, + "th": 4.966054257238284e-05, + "ur": 9.627135113987606e-06, + "hr": 9.330939064966515e-06, + "bg": 1.0409415153844748e-05, + "lt": 3.3987944902946765e-07, + "la": 0.0007412483682855964, + "mi": 1.7985856175073422e-05, + "ml": 7.195247917479719e-07, + "cy": 0.00010846859368029982, + "sk": 3.029312438229681e-06, + "te": 1.0633887086441973e-06, + "fa": 1.1795412319770548e-05, + "lv": 2.6886678483606374e-07, + 
"bn": 6.654516369053454e-07, + "sr": 7.124260292812323e-08, + "az": 1.4848232865460886e-07, + "sl": 1.3365954146138392e-05, + "kn": 2.600472903679929e-08, + "et": 6.865753903184668e-07, + "mk": 1.4848232865460886e-07, + "br": 0.0006049892399460077, + "eu": 5.839152890985133e-06, + "is": 3.094637577305548e-07, + "hy": 5.10219479110674e-07, + "ne": 1.3103519336254976e-07, + "mn": 8.679125471644511e-07, + "bs": 1.8956951635118457e-06, + "kk": 9.005908907511184e-08, + "sq": 8.59349853499225e-08, + "sw": 6.3136294556898065e-06, + "gl": 2.742515607678797e-05, + "mr": 1.330987089431801e-07, + "pa": 5.635753907995422e-08, + "si": 2.1819321318616858e-06, + "km": 0.00010846859368029982, + "sn": 5.7158933486789465e-05, + "yo": 4.5475362639990635e-06, + "so": 6.225109316915223e-09, + "af": 3.452317969276919e-07, + "oc": 9.423914889339358e-05, + "ka": 3.8432503401963913e-08, + "be": 4.917059413855895e-06, + "tg": 6.944611108394838e-09, + "sd": 2.5655444346739387e-07, + "gu": 3.01660172397078e-08, + "am": 6.141496555756021e-08, + "yi": 5.347054070625745e-07, + "lo": 9.238881375495112e-07, + "uz": 3.49196982440958e-09, + "fo": 1.936574705041494e-07, + "ht": 8.629708645457868e-06, + "ps": 6.059006523173593e-07, + "tk": 2.6414245013484106e-08, + "nn": 0.0012221119832247496, + "mt": 3.6672549441618685e-08, + "sa": 8.495916517858859e-06, + "lb": 2.2770503704805378e-08, + "my": 1.323408582720731e-06, + "bo": 5.264155902295897e-07, + "tl": 2.6169269403908402e-05, + "mg": 6.692623344406456e-08, + "as": 1.6659257084938872e-08, + "tt": 3.0576710052798717e-09, + "haw": 5.4541436838917434e-05, + "ln": 2.049735257969587e-06, + "ha": 2.041134550267998e-08, + "ba": 3.088138456064371e-08, + "jw": 0.0003727230941876769, + "su": 1.4028500139318112e-08 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/radio_short.mp3.words.json b/tests/expected/medium_auto/radio_short.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..18b4b928cb799372f99eeaa6990b0375bcbcb839 --- /dev/null +++ b/tests/expected/medium_auto/radio_short.mp3.words.json @@ -0,0 +1,1632 @@ +{ + "text": "3212122222222211111111111111111111111111111111111111111111111", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.04, + "end": 0.7, + "text": "3", + "tokens": [ + 50364, + 18, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.029, + "words": [ + { + "text": "3", + "start": 0.04, + "end": 0.7, + "confidence": 0.029 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.96, + "end": 3.02, + "text": "2", + "tokens": [ + 50464, + 17, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.691, + "words": [ + { + "text": "2", + "start": 1.96, + "end": 3.02, + "confidence": 0.691 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 3.72, + "end": 4.92, + "text": "1", + "tokens": [ + 50564, + 16, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.949, + "words": [ + { + "text": "1", + "start": 3.72, + "end": 4.92, + "confidence": 0.949 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 5.5, + "end": 7.08, + "text": "2", + "tokens": [ + 50664, + 17, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.278, + "words": [ + { + "text": "2", + "start": 5.5, + "end": 7.08, + "confidence": 0.278 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 8.46, + "end": 9.34, + "text": "1", + "tokens": [ + 50764, + 16, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.702, + 
"words": [ + { + "text": "1", + "start": 8.46, + "end": 9.34, + "confidence": 0.702 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 9.78, + "end": 11.34, + "text": "2", + "tokens": [ + 50864, + 17, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.919, + "words": [ + { + "text": "2", + "start": 9.78, + "end": 11.34, + "confidence": 0.919 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 11.8, + "end": 13.4, + "text": "2", + "tokens": [ + 50964, + 17, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.657, + "words": [ + { + "text": "2", + "start": 11.8, + "end": 13.4, + "confidence": 0.657 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 13.68, + "end": 15.54, + "text": "2", + "tokens": [ + 51064, + 17, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.773, + "words": [ + { + "text": "2", + "start": 13.68, + "end": 15.54, + "confidence": 0.773 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 15.54, + "end": 17.2, + "text": "2", + "tokens": [ + 51164, + 17, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.905, + "words": [ + { + "text": "2", + "start": 15.54, + "end": 17.2, + "confidence": 0.905 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 17.5, + "end": 19.24, + "text": "2", + "tokens": [ + 51264, + 17, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.809, + "words": [ + { + "text": "2", + "start": 17.5, + "end": 19.24, + "confidence": 0.809 + } + ] + }, + { + "id": 10, + "seek": 0, + "start": 19.64, + "end": 20.8, 
+ "text": "2", + "tokens": [ + 51364, + 17, + 51464 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.626, + "words": [ + { + "text": "2", + "start": 19.64, + "end": 20.8, + "confidence": 0.626 + } + ] + }, + { + "id": 11, + "seek": 0, + "start": 22.06, + "end": 22.9, + "text": "2", + "tokens": [ + 51464, + 17, + 51564 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.834, + "words": [ + { + "text": "2", + "start": 22.06, + "end": 22.9, + "confidence": 0.834 + } + ] + }, + { + "id": 12, + "seek": 0, + "start": 23.56, + "end": 25.08, + "text": "2", + "tokens": [ + 51564, + 17, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.974, + "words": [ + { + "text": "2", + "start": 23.56, + "end": 25.08, + "confidence": 0.974 + } + ] + }, + { + "id": 13, + "seek": 0, + "start": 26.48, + "end": 27.08, + "text": "2", + "tokens": [ + 51664, + 17, + 51764 + ], + "temperature": 0.0, + "avg_logprob": -0.284898887981068, + "compression_ratio": 1.0, + "no_speech_prob": 0.8409799933433533, + "confidence": 0.971, + "words": [ + { + "text": "2", + "start": 26.48, + "end": 27.08, + "confidence": 0.971 + } + ] + }, + { + "id": 14, + "seek": 2800, + "start": 28.12, + "end": 29.62, + "text": "1", + "tokens": [ + 50364, + 16, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.316, + "words": [ + { + "text": "1", + "start": 28.12, + "end": 29.62, + "confidence": 0.316 + } + ] + }, + { + "id": 15, + "seek": 2800, + "start": 30.84, + "end": 31.14, + "text": "1", + "tokens": [ + 50464, + 16, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + 
"compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.545, + "words": [ + { + "text": "1", + "start": 30.84, + "end": 31.14, + "confidence": 0.545 + } + ] + }, + { + "id": 16, + "seek": 2800, + "start": 32.06, + "end": 33.18, + "text": "1", + "tokens": [ + 50564, + 16, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.913, + "words": [ + { + "text": "1", + "start": 32.06, + "end": 33.18, + "confidence": 0.913 + } + ] + }, + { + "id": 17, + "seek": 2800, + "start": 33.5, + "end": 35.1, + "text": "1", + "tokens": [ + 50664, + 16, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.887, + "words": [ + { + "text": "1", + "start": 33.5, + "end": 35.1, + "confidence": 0.887 + } + ] + }, + { + "id": 18, + "seek": 2800, + "start": 36.18, + "end": 36.64, + "text": "1", + "tokens": [ + 50764, + 16, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.957, + "words": [ + { + "text": "1", + "start": 36.18, + "end": 36.64, + "confidence": 0.957 + } + ] + }, + { + "id": 19, + "seek": 2800, + "start": 37.5, + "end": 38.46, + "text": "1", + "tokens": [ + 50864, + 16, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.958, + "words": [ + { + "text": "1", + "start": 37.5, + "end": 38.46, + "confidence": 0.958 + } + ] + }, + { + "id": 20, + "seek": 2800, + "start": 39.5, + "end": 41.14, + "text": "1", + "tokens": [ + 50964, + 16, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + 
"no_speech_prob": 0.18292438983917236, + "confidence": 0.966, + "words": [ + { + "text": "1", + "start": 39.5, + "end": 41.14, + "confidence": 0.966 + } + ] + }, + { + "id": 21, + "seek": 2800, + "start": 41.5, + "end": 43.38, + "text": "1", + "tokens": [ + 51064, + 16, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.973, + "words": [ + { + "text": "1", + "start": 41.5, + "end": 43.38, + "confidence": 0.973 + } + ] + }, + { + "id": 22, + "seek": 2800, + "start": 43.88, + "end": 44.68, + "text": "1", + "tokens": [ + 51164, + 16, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.946, + "words": [ + { + "text": "1", + "start": 43.88, + "end": 44.68, + "confidence": 0.946 + } + ] + }, + { + "id": 23, + "seek": 2800, + "start": 45.5, + "end": 47.16, + "text": "1", + "tokens": [ + 51264, + 16, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.96, + "words": [ + { + "text": "1", + "start": 45.5, + "end": 47.16, + "confidence": 0.96 + } + ] + }, + { + "id": 24, + "seek": 2800, + "start": 47.94, + "end": 48.8, + "text": "1", + "tokens": [ + 51364, + 16, + 51464 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.965, + "words": [ + { + "text": "1", + "start": 47.94, + "end": 48.8, + "confidence": 0.965 + } + ] + }, + { + "id": 25, + "seek": 2800, + "start": 50.22, + "end": 50.96, + "text": "1", + "tokens": [ + 51464, + 16, + 51564 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + 
"confidence": 0.967, + "words": [ + { + "text": "1", + "start": 50.22, + "end": 50.96, + "confidence": 0.967 + } + ] + }, + { + "id": 26, + "seek": 2800, + "start": 52.22, + "end": 52.84, + "text": "1", + "tokens": [ + 51564, + 16, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.963, + "words": [ + { + "text": "1", + "start": 52.22, + "end": 52.84, + "confidence": 0.963 + } + ] + }, + { + "id": 27, + "seek": 2800, + "start": 53.5, + "end": 54.78, + "text": "1", + "tokens": [ + 51664, + 16, + 51764 + ], + "temperature": 0.0, + "avg_logprob": -0.11499140479347923, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.18292438983917236, + "confidence": 0.945, + "words": [ + { + "text": "1", + "start": 53.5, + "end": 54.78, + "confidence": 0.945 + } + ] + }, + { + "id": 28, + "seek": 5600, + "start": 56.56, + "end": 57.24, + "text": "1", + "tokens": [ + 50364, + 16, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.425, + "words": [ + { + "text": "1", + "start": 56.56, + "end": 57.24, + "confidence": 0.425 + } + ] + }, + { + "id": 29, + "seek": 5600, + "start": 57.64, + "end": 58.86, + "text": "1", + "tokens": [ + 50464, + 16, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.789, + "words": [ + { + "text": "1", + "start": 57.64, + "end": 58.86, + "confidence": 0.789 + } + ] + }, + { + "id": 30, + "seek": 5600, + "start": 60.08, + "end": 60.92, + "text": "1", + "tokens": [ + 50564, + 16, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.953, + "words": [ + { + "text": 
"1", + "start": 60.08, + "end": 60.92, + "confidence": 0.953 + } + ] + }, + { + "id": 31, + "seek": 5600, + "start": 61.5, + "end": 62.62, + "text": "1", + "tokens": [ + 50664, + 16, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.949, + "words": [ + { + "text": "1", + "start": 61.5, + "end": 62.62, + "confidence": 0.949 + } + ] + }, + { + "id": 32, + "seek": 5600, + "start": 64.36, + "end": 65.06, + "text": "1", + "tokens": [ + 50764, + 16, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.954, + "words": [ + { + "text": "1", + "start": 64.36, + "end": 65.06, + "confidence": 0.954 + } + ] + }, + { + "id": 33, + "seek": 5600, + "start": 65.5, + "end": 66.92, + "text": "1", + "tokens": [ + 50864, + 16, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.952, + "words": [ + { + "text": "1", + "start": 65.5, + "end": 66.92, + "confidence": 0.952 + } + ] + }, + { + "id": 34, + "seek": 5600, + "start": 67.96, + "end": 69.06, + "text": "1", + "tokens": [ + 50964, + 16, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.965, + "words": [ + { + "text": "1", + "start": 67.96, + "end": 69.06, + "confidence": 0.965 + } + ] + }, + { + "id": 35, + "seek": 5600, + "start": 70.38, + "end": 71.69, + "text": "1", + "tokens": [ + 51064, + 16, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.956, + "words": [ + { + "text": "1", + "start": 70.38, + "end": 71.69, + 
"confidence": 0.956 + } + ] + }, + { + "id": 36, + "seek": 5600, + "start": 71.69, + "end": 73.56, + "text": "1", + "tokens": [ + 51164, + 16, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.957, + "words": [ + { + "text": "1", + "start": 71.69, + "end": 73.56, + "confidence": 0.957 + } + ] + }, + { + "id": 37, + "seek": 5600, + "start": 73.56, + "end": 75.34, + "text": "1", + "tokens": [ + 51264, + 16, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.955, + "words": [ + { + "text": "1", + "start": 73.56, + "end": 75.34, + "confidence": 0.955 + } + ] + }, + { + "id": 38, + "seek": 5600, + "start": 75.5, + "end": 76.42, + "text": "1", + "tokens": [ + 51364, + 16, + 51464 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.939, + "words": [ + { + "text": "1", + "start": 75.5, + "end": 76.42, + "confidence": 0.939 + } + ] + }, + { + "id": 39, + "seek": 5600, + "start": 78.14, + "end": 78.78, + "text": "1", + "tokens": [ + 51464, + 16, + 51564 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.936, + "words": [ + { + "text": "1", + "start": 78.14, + "end": 78.78, + "confidence": 0.936 + } + ] + }, + { + "id": 40, + "seek": 5600, + "start": 80.08, + "end": 80.86, + "text": "1", + "tokens": [ + 51564, + 16, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.922, + "words": [ + { + "text": "1", + "start": 80.08, + "end": 80.86, + "confidence": 0.922 + } + ] + }, + { + "id": 41, + 
"seek": 5600, + "start": 81.5, + "end": 82.84, + "text": "1", + "tokens": [ + 51664, + 16, + 51764 + ], + "temperature": 0.0, + "avg_logprob": -0.1206196438182484, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1875864416360855, + "confidence": 0.896, + "words": [ + { + "text": "1", + "start": 81.5, + "end": 82.84, + "confidence": 0.896 + } + ] + }, + { + "id": 42, + "seek": 8400, + "start": 84.82, + "end": 85.6, + "text": "1", + "tokens": [ + 50364, + 16, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.793, + "words": [ + { + "text": "1", + "start": 84.82, + "end": 85.6, + "confidence": 0.793 + } + ] + }, + { + "id": 43, + "seek": 8400, + "start": 85.6, + "end": 86.8, + "text": "1", + "tokens": [ + 50464, + 16, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.88, + "words": [ + { + "text": "1", + "start": 85.6, + "end": 86.8, + "confidence": 0.88 + } + ] + }, + { + "id": 44, + "seek": 8400, + "start": 87.76, + "end": 88.72, + "text": "1", + "tokens": [ + 50564, + 16, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.954, + "words": [ + { + "text": "1", + "start": 87.76, + "end": 88.72, + "confidence": 0.954 + } + ] + }, + { + "id": 45, + "seek": 8400, + "start": 89.5, + "end": 90.52, + "text": "1", + "tokens": [ + 50664, + 16, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.951, + "words": [ + { + "text": "1", + "start": 89.5, + "end": 90.52, + "confidence": 0.951 + } + ] + }, + { + "id": 46, + "seek": 8400, + "start": 91.5, + "end": 93.02, + "text": 
"1", + "tokens": [ + 50764, + 16, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.91, + "words": [ + { + "text": "1", + "start": 91.5, + "end": 93.02, + "confidence": 0.91 + } + ] + }, + { + "id": 47, + "seek": 8400, + "start": 93.68, + "end": 95.36, + "text": "1", + "tokens": [ + 50864, + 16, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.944, + "words": [ + { + "text": "1", + "start": 93.68, + "end": 95.36, + "confidence": 0.944 + } + ] + }, + { + "id": 48, + "seek": 8400, + "start": 95.86, + "end": 97.84, + "text": "1", + "tokens": [ + 50964, + 16, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.967, + "words": [ + { + "text": "1", + "start": 95.86, + "end": 97.84, + "confidence": 0.967 + } + ] + }, + { + "id": 49, + "seek": 8400, + "start": 97.84, + "end": 98.98, + "text": "1", + "tokens": [ + 51064, + 16, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.976, + "words": [ + { + "text": "1", + "start": 97.84, + "end": 98.98, + "confidence": 0.976 + } + ] + }, + { + "id": 50, + "seek": 8400, + "start": 99.5, + "end": 101.1, + "text": "1", + "tokens": [ + 51164, + 16, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.981, + "words": [ + { + "text": "1", + "start": 99.5, + "end": 101.1, + "confidence": 0.981 + } + ] + }, + { + "id": 51, + "seek": 8400, + "start": 101.5, + "end": 103.48, + "text": "1", + "tokens": [ + 51264, + 16, + 51364 + ], + 
"temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.985, + "words": [ + { + "text": "1", + "start": 101.5, + "end": 103.48, + "confidence": 0.985 + } + ] + }, + { + "id": 52, + "seek": 8400, + "start": 103.5, + "end": 105.44, + "text": "1", + "tokens": [ + 51364, + 16, + 51464 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.987, + "words": [ + { + "text": "1", + "start": 103.5, + "end": 105.44, + "confidence": 0.987 + } + ] + }, + { + "id": 53, + "seek": 8400, + "start": 105.58, + "end": 107.08, + "text": "1", + "tokens": [ + 51464, + 16, + 51564 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.956, + "words": [ + { + "text": "1", + "start": 105.58, + "end": 107.08, + "confidence": 0.956 + } + ] + }, + { + "id": 54, + "seek": 8400, + "start": 108.32, + "end": 108.98, + "text": "1", + "tokens": [ + 51564, + 16, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.946, + "words": [ + { + "text": "1", + "start": 108.32, + "end": 108.98, + "confidence": 0.946 + } + ] + }, + { + "id": 55, + "seek": 8400, + "start": 109.5, + "end": 110.4, + "text": "1", + "tokens": [ + 51664, + 16, + 51764 + ], + "temperature": 0.0, + "avg_logprob": -0.10664921457117255, + "compression_ratio": 1.2727272727272727, + "no_speech_prob": 0.1820167452096939, + "confidence": 0.888, + "words": [ + { + "text": "1", + "start": 109.5, + "end": 110.4, + "confidence": 0.888 + } + ] + }, + { + "id": 56, + "seek": 11200, + "start": 112.66, + "end": 113.32, + "text": "1", + "tokens": [ + 50364, + 16, + 50464 + ], + "temperature": 0.0, + 
"avg_logprob": -0.12969079613685608, + "compression_ratio": 0.45454545454545453, + "no_speech_prob": 0.27970418334007263, + "confidence": 0.917, + "words": [ + { + "text": "1", + "start": 112.66, + "end": 113.32, + "confidence": 0.917 + } + ] + }, + { + "id": 57, + "seek": 11200, + "start": 113.98, + "end": 114.82, + "text": "1", + "tokens": [ + 50464, + 16, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.12969079613685608, + "compression_ratio": 0.45454545454545453, + "no_speech_prob": 0.27970418334007263, + "confidence": 0.888, + "words": [ + { + "text": "1", + "start": 113.98, + "end": 114.82, + "confidence": 0.888 + } + ] + }, + { + "id": 58, + "seek": 11200, + "start": 116.1, + "end": 117.3, + "text": "1", + "tokens": [ + 50564, + 16, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.12969079613685608, + "compression_ratio": 0.45454545454545453, + "no_speech_prob": 0.27970418334007263, + "confidence": 0.979, + "words": [ + { + "text": "1", + "start": 116.1, + "end": 117.3, + "confidence": 0.979 + } + ] + }, + { + "id": 59, + "seek": 11200, + "start": 117.5, + "end": 118.68, + "text": "1", + "tokens": [ + 50664, + 16, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.12969079613685608, + "compression_ratio": 0.45454545454545453, + "no_speech_prob": 0.27970418334007263, + "confidence": 0.981, + "words": [ + { + "text": "1", + "start": 117.5, + "end": 118.68, + "confidence": 0.981 + } + ] + }, + { + "id": 60, + "seek": 11200, + "start": 119.5, + "end": 120.86, + "text": "1", + "tokens": [ + 50764, + 16, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.12969079613685608, + "compression_ratio": 0.45454545454545453, + "no_speech_prob": 0.27970418334007263, + "confidence": 0.973, + "words": [ + { + "text": "1", + "start": 119.5, + "end": 120.86, + "confidence": 0.973 + } + ] + } + ], + "language": "zh", + "language_probs": { + "en": 0.3608749508857727, + "zh": 0.40258511900901794, + "de": 0.017688356339931488, + "es": 0.013351871632039547, + 
"ru": 0.024557847529649734, + "ko": 0.03202947601675987, + "fr": 0.010237235575914383, + "ja": 0.024944579228758812, + "pt": 0.014436815865337849, + "tr": 0.011968540027737617, + "pl": 0.0067137423902750015, + "ca": 0.0001964998955372721, + "nl": 0.0022488220129162073, + "ar": 0.006306977476924658, + "sv": 0.0012813402572646737, + "it": 0.005653538275510073, + "id": 0.0013428329257294536, + "hi": 0.001451948657631874, + "fi": 0.0006052622338756919, + "vi": 0.004614283796399832, + "he": 0.0003614185843616724, + "uk": 0.0006442983285523951, + "el": 0.0013015182921662927, + "ms": 0.0029792049899697304, + "cs": 0.0003728912561200559, + "ro": 0.000982437515631318, + "da": 0.00043595407623797655, + "hu": 0.0023202074225991964, + "ta": 0.00022616998467128724, + "no": 0.00028590564033947885, + "th": 0.0027553143445402384, + "ur": 0.0006244753021746874, + "hr": 5.992907608742826e-05, + "bg": 4.594921847456135e-05, + "lt": 1.0744692190201022e-05, + "la": 0.0025482492055743933, + "mi": 0.0003502989129628986, + "ml": 0.00017614134412724525, + "cy": 0.0029792049899697304, + "sk": 1.9762512238230556e-05, + "te": 0.00020273745758458972, + "fa": 0.0007300855941139162, + "lv": 2.2876768071000697e-06, + "bn": 0.00011372540757292882, + "sr": 2.552088062657276e-06, + "az": 2.1490734525286825e-06, + "sl": 3.2077721698442474e-05, + "kn": 6.868851301078394e-07, + "et": 2.0188676899124403e-06, + "mk": 3.244615527364658e-07, + "br": 0.0006752188201062381, + "eu": 2.4594843125669286e-05, + "is": 1.8857521354220808e-05, + "hy": 6.415948973881314e-06, + "ne": 2.3838139895815402e-05, + "mn": 1.9456123482086696e-05, + "bs": 2.0389841665746644e-05, + "kk": 2.0188676899124403e-06, + "sq": 1.8671472616915707e-06, + "sw": 1.1085765436291695e-05, + "gl": 0.00017341053171548992, + "mr": 1.6737000123612233e-06, + "pa": 4.996745246899081e-06, + "si": 0.00014376237231772393, + "km": 0.00041599024552851915, + "sn": 0.00018459455168340355, + "yo": 3.9302449295064434e-05, + "so": 1.7097923432629614e-07, + 
"af": 1.8097013025908382e-06, + "oc": 1.4458562873187475e-05, + "ka": 3.1943122280608804e-07, + "be": 3.8093239709269255e-05, + "tg": 6.14426696188275e-08, + "sd": 5.8417867876414675e-06, + "gu": 2.4111935204018664e-07, + "am": 1.9833936448776512e-07, + "yi": 1.025265646603657e-05, + "lo": 1.4458562873187475e-05, + "uz": 1.0760877522386636e-08, + "fo": 1.2175330084573943e-05, + "ht": 8.499750947521534e-06, + "ps": 1.198656900669448e-05, + "tk": 7.411401270474016e-08, + "nn": 0.02100544236600399, + "mt": 1.9374485304979316e-07, + "sa": 0.00014376237231772393, + "lb": 2.2253061615629122e-08, + "my": 0.00010517879854887724, + "bo": 2.1368370653362945e-05, + "tl": 0.0008144693565554917, + "mg": 1.0616341228342208e-07, + "as": 1.2055209026584635e-06, + "tt": 1.0594044752565424e-08, + "haw": 0.004989230073988438, + "ln": 2.689880886919127e-07, + "ha": 5.296689664646692e-08, + "ba": 7.239716381945982e-08, + "jw": 0.007373603526502848, + "su": 1.3954918642866687e-07 + } +} \ No newline at end of file diff --git a/tests/expected/medium_auto/smartphone.mp3.words.json b/tests/expected/medium_auto/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..45164d8b8e4c657445fbb0687e46114bd1acb1b5 --- /dev/null +++ b/tests/expected/medium_auto/smartphone.mp3.words.json @@ -0,0 +1,5000 @@ +{ + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions, mais la manière dont elles interagissent entre elles. Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces. L'écran tactile a été beaucoup très souvent mentionné. Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes. Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible. 
Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but. Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité. Mais ça, ça soulève une autre interrogation. Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit ? Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone ? Il n'y a pas d'équivalent en fait. Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant. Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendant de cet objet, d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet. Donc à objet inédit, rapport inédit. Et ce rapport, si j'en crois à Nicolas, serait caractérisé par un mélange de dépendance et de rejet. Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment. Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre. On peut adorer sa bagnole, en avoir besoin pour plein de choses. Le soir, quand on va se coucher, on la laisse. On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes. On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. 
Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui, continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe, comme si le lâcher allait entraîner sa mort immédiate. Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi. Donc, rapport inédit, d'accord. Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais ? Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux ? Les économistes parlent de dépendance du sentier. C'est l'idée qu'on met sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.4, + "end": 3.66, + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça.", + "tokens": [ + 50364, + 383, + 6, + 377, + 20090, + 1078, + 1769, + 631, + 6176, + 38268, + 11, + 2420, + 1506, + 408, + 385, + 287, + 6, + 22824, + 14540, + 49990, + 526, + 5173, + 2788, + 13, + 50539 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.935, + "words": [ + { + "text": "C'est", + "start": 0.4, + "end": 0.64, + "confidence": 0.961 + }, + { + "text": "évident", + "start": 0.64, + "end": 0.9, + "confidence": 0.984 + }, + { + "text": "ce", + "start": 0.9, + "end": 1.0, + "confidence": 0.663 + }, + { + "text": "que", + "start": 1.0, + "end": 1.08, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 1.08, + "end": 1.2, + "confidence": 0.994 + }, + { + "text": "Nicolas,", + "start": 1.2, + "end": 1.48, + "confidence": 0.91 + }, + { + "text": "mais", + "start": 1.7, + "end": 2.04, + "confidence": 0.979 + }, + { + "text": "je", + "start": 2.04, + "end": 2.26, + "confidence": 0.981 + }, + { + "text": "ne", + "start": 2.26, 
+ "end": 2.34, + "confidence": 0.837 + }, + { + "text": "me", + "start": 2.34, + "end": 2.36, + "confidence": 0.821 + }, + { + "text": "l'étais", + "start": 2.36, + "end": 2.58, + "confidence": 0.971 + }, + { + "text": "jamais", + "start": 2.58, + "end": 2.88, + "confidence": 0.989 + }, + { + "text": "formulé", + "start": 2.88, + "end": 3.26, + "confidence": 0.908 + }, + { + "text": "comme", + "start": 3.26, + "end": 3.44, + "confidence": 0.993 + }, + { + "text": "ça.", + "start": 3.44, + "end": 3.66, + "confidence": 0.975 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 4.16, + "end": 7.94, + "text": " Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions,", + "tokens": [ + 50549, + 8257, + 1956, + 3887, + 635, + 3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 287, + 6, + 8476, + 449, + 2776, + 730, + 17290, + 3916, + 11, + 50756 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.93, + "words": [ + { + "text": "Ce", + "start": 4.16, + "end": 4.28, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 4.28, + "end": 4.36, + "confidence": 0.958 + }, + { + "text": "fait", + "start": 4.36, + "end": 4.5, + "confidence": 0.567 + }, + { + "text": "la", + "start": 4.5, + "end": 4.76, + "confidence": 0.972 + }, + { + "text": "force", + "start": 4.76, + "end": 5.02, + "confidence": 0.999 + }, + { + "text": "du", + "start": 5.02, + "end": 5.22, + "confidence": 0.996 + }, + { + "text": "smartphone,", + "start": 5.22, + "end": 5.7, + "confidence": 0.912 + }, + { + "text": "c'est", + "start": 6.04, + "end": 6.16, + "confidence": 0.879 + }, + { + "text": "pas", + "start": 6.16, + "end": 6.26, + "confidence": 0.991 + }, + { + "text": "seulement", + "start": 6.26, + "end": 6.54, + "confidence": 0.999 + }, + { + "text": "l'accumulation", + "start": 6.54, + "end": 7.4, + "confidence": 0.958 + }, + { + "text": 
"des", + "start": 7.4, + "end": 7.58, + "confidence": 0.983 + }, + { + "text": "fonctions,", + "start": 7.58, + "end": 7.94, + "confidence": 0.987 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 8.32, + "end": 10.88, + "text": " mais la manière dont elles interagissent entre elles.", + "tokens": [ + 50756, + 2420, + 635, + 22267, + 9400, + 23576, + 728, + 559, + 25450, + 3962, + 23576, + 13, + 50906 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.977, + "words": [ + { + "text": "mais", + "start": 8.32, + "end": 8.48, + "confidence": 0.992 + }, + { + "text": "la", + "start": 8.48, + "end": 8.7, + "confidence": 0.995 + }, + { + "text": "manière", + "start": 8.7, + "end": 8.94, + "confidence": 0.999 + }, + { + "text": "dont", + "start": 8.94, + "end": 9.08, + "confidence": 0.978 + }, + { + "text": "elles", + "start": 9.08, + "end": 9.48, + "confidence": 0.967 + }, + { + "text": "interagissent", + "start": 9.48, + "end": 10.38, + "confidence": 0.964 + }, + { + "text": "entre", + "start": 10.38, + "end": 10.7, + "confidence": 0.955 + }, + { + "text": "elles.", + "start": 10.7, + "end": 10.88, + "confidence": 0.989 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 10.96, + "end": 13.0, + "text": " Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant.", + "tokens": [ + 50906, + 8257, + 1956, + 6176, + 274, + 6, + 19400, + 1022, + 635, + 5052, + 11, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13, + 51006 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.906, + "words": [ + { + "text": "Ce", + "start": 10.96, + "end": 11.16, + "confidence": 0.608 + }, + { + "text": "qui", + "start": 11.16, + "end": 11.26, + "confidence": 0.769 + }, + { + "text": "dit", + "start": 11.26, + "end": 11.38, + "confidence": 0.983 + }, + { 
+ "text": "d'ailleurs", + "start": 11.38, + "end": 11.58, + "confidence": 0.985 + }, + { + "text": "sur", + "start": 11.58, + "end": 11.72, + "confidence": 0.48 + }, + { + "text": "la", + "start": 11.72, + "end": 11.82, + "confidence": 0.984 + }, + { + "text": "photo,", + "start": 11.82, + "end": 12.0, + "confidence": 0.994 + }, + { + "text": "c'est", + "start": 12.14, + "end": 12.2, + "confidence": 0.997 + }, + { + "text": "hyper", + "start": 12.2, + "end": 12.48, + "confidence": 0.993 + }, + { + "text": "convaincant.", + "start": 12.48, + "end": 13.0, + "confidence": 0.982 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.38, + "end": 16.04, + "text": " Alors évidemment, il faudrait ajouter les interfaces.", + "tokens": [ + 51006, + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 13, + 51166 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.912, + "words": [ + { + "text": "Alors", + "start": 13.38, + "end": 13.58, + "confidence": 0.584 + }, + { + "text": "évidemment,", + "start": 13.58, + "end": 13.86, + "confidence": 0.832 + }, + { + "text": "il", + "start": 14.26, + "end": 14.42, + "confidence": 0.953 + }, + { + "text": "faudrait", + "start": 14.42, + "end": 14.76, + "confidence": 0.996 + }, + { + "text": "ajouter", + "start": 14.76, + "end": 15.2, + "confidence": 0.992 + }, + { + "text": "les", + "start": 15.2, + "end": 15.6, + "confidence": 0.985 + }, + { + "text": "interfaces.", + "start": 15.6, + "end": 16.04, + "confidence": 0.984 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 16.22, + "end": 19.36, + "text": " L'écran tactile a été beaucoup très souvent mentionné.", + "tokens": [ + 51166, + 441, + 6, + 9062, + 4257, + 47319, + 257, + 8862, + 8796, + 5732, + 20847, + 2152, + 15055, + 13, + 51331 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 
1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.923, + "words": [ + { + "text": "L'écran", + "start": 16.22, + "end": 16.78, + "confidence": 0.996 + }, + { + "text": "tactile", + "start": 16.78, + "end": 17.1, + "confidence": 0.986 + }, + { + "text": "a", + "start": 17.1, + "end": 17.3, + "confidence": 0.98 + }, + { + "text": "été", + "start": 17.3, + "end": 17.84, + "confidence": 0.974 + }, + { + "text": "beaucoup", + "start": 17.84, + "end": 18.28, + "confidence": 0.976 + }, + { + "text": "très", + "start": 18.28, + "end": 18.62, + "confidence": 0.447 + }, + { + "text": "souvent", + "start": 18.62, + "end": 18.9, + "confidence": 0.996 + }, + { + "text": "mentionné.", + "start": 18.9, + "end": 19.36, + "confidence": 0.978 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 20.02, + "end": 25.44, + "text": " Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes.", + "tokens": [ + 51331, + 6313, + 4428, + 11, + 1930, + 8487, + 1264, + 421, + 6, + 388, + 1740, + 642, + 6212, + 368, + 945, + 1567, + 17338, + 1512, + 358, + 1625, + 1512, + 4792, + 13923, + 2156, + 4666, + 6592, + 724, + 5714, + 1531, + 596, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 13, + 51631 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.92, + "words": [ + { + "text": "Mais", + "start": 20.02, + "end": 20.26, + "confidence": 0.943 + }, + { + "text": "bon,", + "start": 20.26, + "end": 20.5, + "confidence": 0.666 + }, + { + "text": "il", + "start": 20.52, + "end": 20.62, + "confidence": 0.99 + }, + { + "text": "faut", + "start": 20.62, + "end": 20.7, + "confidence": 0.99 + }, + { + "text": "dire", + "start": 20.7, + "end": 20.82, + "confidence": 0.995 + }, + { + "text": "qu'il", + "start": 20.82, + "end": 21.04, + "confidence": 0.88 + }, + { + "text": "profite", + "start": 
21.04, + "end": 21.3, + "confidence": 0.995 + }, + { + "text": "aussi", + "start": 21.3, + "end": 21.7, + "confidence": 0.972 + }, + { + "text": "de", + "start": 21.7, + "end": 21.94, + "confidence": 0.97 + }, + { + "text": "20", + "start": 21.94, + "end": 22.16, + "confidence": 0.812 + }, + { + "text": "ans", + "start": 22.16, + "end": 22.3, + "confidence": 0.997 + }, + { + "text": "pendant", + "start": 22.3, + "end": 22.54, + "confidence": 0.723 + }, + { + "text": "lesquels", + "start": 22.54, + "end": 22.92, + "confidence": 0.98 + }, + { + "text": "les", + "start": 22.92, + "end": 23.14, + "confidence": 0.71 + }, + { + "text": "ordinateurs", + "start": 23.14, + "end": 23.58, + "confidence": 0.966 + }, + { + "text": "nous", + "start": 23.58, + "end": 23.74, + "confidence": 0.602 + }, + { + "text": "ont", + "start": 23.74, + "end": 23.88, + "confidence": 0.974 + }, + { + "text": "appris", + "start": 23.88, + "end": 24.12, + "confidence": 0.991 + }, + { + "text": "à", + "start": 24.12, + "end": 24.26, + "confidence": 0.828 + }, + { + "text": "cliquer", + "start": 24.26, + "end": 24.54, + "confidence": 0.989 + }, + { + "text": "sur", + "start": 24.54, + "end": 24.72, + "confidence": 0.984 + }, + { + "text": "des", + "start": 24.72, + "end": 24.92, + "confidence": 0.971 + }, + { + "text": "icônes.", + "start": 24.92, + "end": 25.44, + "confidence": 0.992 + } + ] + }, + { + "id": 7, + "seek": 2534, + "start": 25.54, + "end": 30.64, + "text": " Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible.", + "tokens": [ + 50364, + 318, + 9507, + 631, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 1769, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13, + 50639 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.968, + "words": [ + { + "text": "Sauf", + "start": 25.54, + "end": 
25.82, + "confidence": 0.974 + }, + { + "text": "que", + "start": 25.82, + "end": 26.3, + "confidence": 0.996 + }, + { + "text": "le", + "start": 26.3, + "end": 26.66, + "confidence": 0.671 + }, + { + "text": "smartphone", + "start": 26.66, + "end": 27.08, + "confidence": 0.995 + }, + { + "text": "ajoute", + "start": 27.08, + "end": 27.48, + "confidence": 0.99 + }, + { + "text": "le", + "start": 27.48, + "end": 27.66, + "confidence": 0.989 + }, + { + "text": "toucher,", + "start": 27.66, + "end": 28.06, + "confidence": 0.987 + }, + { + "text": "ce", + "start": 28.14, + "end": 28.16, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 28.16, + "end": 28.3, + "confidence": 1.0 + }, + { + "text": "rend", + "start": 28.3, + "end": 28.54, + "confidence": 0.994 + }, + { + "text": "le", + "start": 28.54, + "end": 28.8, + "confidence": 0.992 + }, + { + "text": "contact", + "start": 28.8, + "end": 29.16, + "confidence": 0.999 + }, + { + "text": "plus", + "start": 29.16, + "end": 29.58, + "confidence": 0.983 + }, + { + "text": "direct,", + "start": 29.58, + "end": 30.0, + "confidence": 0.991 + }, + { + "text": "plus", + "start": 30.1, + "end": 30.24, + "confidence": 0.99 + }, + { + "text": "sensible.", + "start": 30.24, + "end": 30.64, + "confidence": 0.997 + } + ] + }, + { + "id": 8, + "seek": 2534, + "start": 31.04, + "end": 37.82, + "text": " Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but.", + "tokens": [ + 50639, + 3790, + 9093, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193, + 476, + 18437, + 10095, + 602, + 84, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 1609, + 457, + 13, + 50989 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.893, + "words": [ + { + 
"text": "Et", + "start": 31.04, + "end": 31.24, + "confidence": 0.964 + }, + { + "text": "puis", + "start": 31.24, + "end": 31.34, + "confidence": 0.967 + }, + { + "text": "évidemment,", + "start": 31.34, + "end": 31.62, + "confidence": 0.87 + }, + { + "text": "il", + "start": 31.66, + "end": 31.72, + "confidence": 0.99 + }, + { + "text": "faudrait", + "start": 31.72, + "end": 31.94, + "confidence": 0.996 + }, + { + "text": "parler", + "start": 31.94, + "end": 32.16, + "confidence": 0.864 + }, + { + "text": "aussi", + "start": 32.16, + "end": 32.34, + "confidence": 0.971 + }, + { + "text": "des", + "start": 32.34, + "end": 32.48, + "confidence": 0.993 + }, + { + "text": "applications", + "start": 32.48, + "end": 32.92, + "confidence": 0.993 + }, + { + "text": "qui", + "start": 32.92, + "end": 33.22, + "confidence": 0.564 + }, + { + "text": "permettent", + "start": 33.22, + "end": 33.76, + "confidence": 0.99 + }, + { + "text": "de", + "start": 33.76, + "end": 33.98, + "confidence": 0.871 + }, + { + "text": "contourner", + "start": 33.98, + "end": 34.42, + "confidence": 0.953 + }, + { + "text": "le", + "start": 34.42, + "end": 34.54, + "confidence": 0.75 + }, + { + "text": "côté", + "start": 34.54, + "end": 34.78, + "confidence": 0.985 + }, + { + "text": "touffu", + "start": 34.78, + "end": 35.32, + "confidence": 0.726 + }, + { + "text": "de", + "start": 35.32, + "end": 35.7, + "confidence": 0.882 + }, + { + "text": "la", + "start": 35.7, + "end": 35.82, + "confidence": 0.991 + }, + { + "text": "navigation", + "start": 35.82, + "end": 36.3, + "confidence": 0.992 + }, + { + "text": "web", + "start": 36.3, + "end": 36.58, + "confidence": 0.847 + }, + { + "text": "pour", + "start": 36.58, + "end": 36.76, + "confidence": 0.59 + }, + { + "text": "aller", + "start": 36.76, + "end": 37.16, + "confidence": 0.981 + }, + { + "text": "directement", + "start": 37.16, + "end": 37.54, + "confidence": 0.997 + }, + { + "text": "au", + "start": 37.54, + "end": 37.7, + "confidence": 
0.969 + }, + { + "text": "but.", + "start": 37.7, + "end": 37.82, + "confidence": 0.995 + } + ] + }, + { + "id": 9, + "seek": 2534, + "start": 37.9, + "end": 46.6, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 50989, + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 8603, + 14964, + 9400, + 38268, + 6176, + 421, + 6, + 388, + 871, + 6070, + 271, + 443, + 5199, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13, + 51439 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.973, + "words": [ + { + "text": "Bref,", + "start": 37.9, + "end": 38.24, + "confidence": 0.984 + }, + { + "text": "tout", + "start": 38.88, + "end": 39.02, + "confidence": 0.701 + }, + { + "text": "ça,", + "start": 39.02, + "end": 39.4, + "confidence": 0.995 + }, + { + "text": "ce", + "start": 39.4, + "end": 39.72, + "confidence": 0.989 + }, + { + "text": "sont", + "start": 39.72, + "end": 39.92, + "confidence": 0.999 + }, + { + "text": "les", + "start": 39.92, + "end": 40.22, + "confidence": 0.992 + }, + { + "text": "conditions", + "start": 40.22, + "end": 40.7, + "confidence": 0.995 + }, + { + "text": "qui", + "start": 40.7, + "end": 41.02, + "confidence": 0.997 + }, + { + "text": "permettent", + "start": 41.02, + "end": 41.44, + "confidence": 0.996 + }, + { + "text": "de", + "start": 41.44, + "end": 41.74, + "confidence": 0.997 + }, + { + "text": "créer", + "start": 41.74, + "end": 42.1, + "confidence": 0.999 + }, + { + "text": "cet", + "start": 42.1, + "end": 42.38, + "confidence": 0.997 + }, + { + "text": "objet", + "start": 42.38, + "end": 42.64, + "confidence": 0.994 + }, + { + "text": "dont", + "start": 42.64, + "end": 42.84, 
+ "confidence": 0.789 + }, + { + "text": "Nicolas", + "start": 42.84, + "end": 43.24, + "confidence": 0.988 + }, + { + "text": "dit", + "start": 43.24, + "end": 43.52, + "confidence": 0.986 + }, + { + "text": "qu'il", + "start": 43.52, + "end": 43.74, + "confidence": 0.982 + }, + { + "text": "est", + "start": 43.74, + "end": 43.94, + "confidence": 0.99 + }, + { + "text": "vraisemblablement", + "start": 43.94, + "end": 44.86, + "confidence": 0.99 + }, + { + "text": "inédit", + "start": 44.86, + "end": 45.44, + "confidence": 0.98 + }, + { + "text": "dans", + "start": 45.44, + "end": 45.72, + "confidence": 0.967 + }, + { + "text": "l'histoire", + "start": 45.72, + "end": 46.02, + "confidence": 0.958 + }, + { + "text": "de", + "start": 46.02, + "end": 46.14, + "confidence": 0.999 + }, + { + "text": "l'humanité.", + "start": 46.14, + "end": 46.6, + "confidence": 0.992 + } + ] + }, + { + "id": 10, + "seek": 2534, + "start": 47.02, + "end": 48.78, + "text": " Mais ça, ça soulève une autre interrogation.", + "tokens": [ + 51439, + 6313, + 2788, + 11, + 2788, + 5133, + 31397, + 2251, + 15081, + 24871, + 399, + 13, + 51539 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.969, + "words": [ + { + "text": "Mais", + "start": 47.02, + "end": 47.28, + "confidence": 0.84 + }, + { + "text": "ça,", + "start": 47.28, + "end": 47.48, + "confidence": 0.942 + }, + { + "text": "ça", + "start": 47.62, + "end": 47.64, + "confidence": 0.976 + }, + { + "text": "soulève", + "start": 47.64, + "end": 47.86, + "confidence": 0.993 + }, + { + "text": "une", + "start": 47.86, + "end": 48.02, + "confidence": 0.998 + }, + { + "text": "autre", + "start": 48.02, + "end": 48.2, + "confidence": 0.999 + }, + { + "text": "interrogation.", + "start": 48.2, + "end": 48.78, + "confidence": 0.997 + } + ] + }, + { + "id": 11, + "seek": 4884, + "start": 49.36, + "end": 55.5, + "text": " Est-ce 
que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit ?", + "tokens": [ + 50389, + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 8603, + 14964, + 12703, + 294, + 7811, + 270, + 13716, + 270, + 631, + 10349, + 18018, + 1531, + 8783, + 871, + 6212, + 517, + 18018, + 294, + 7811, + 270, + 2506, + 50689 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.986, + "words": [ + { + "text": "Est-ce", + "start": 49.36, + "end": 49.64, + "confidence": 0.978 + }, + { + "text": "que", + "start": 49.64, + "end": 49.76, + "confidence": 0.991 + }, + { + "text": "le", + "start": 49.76, + "end": 49.82, + "confidence": 0.993 + }, + { + "text": "fait", + "start": 49.82, + "end": 50.0, + "confidence": 0.999 + }, + { + "text": "que", + "start": 50.0, + "end": 50.14, + "confidence": 0.991 + }, + { + "text": "cet", + "start": 50.14, + "end": 50.32, + "confidence": 0.99 + }, + { + "text": "objet", + "start": 50.32, + "end": 50.66, + "confidence": 0.997 + }, + { + "text": "soit", + "start": 50.66, + "end": 51.12, + "confidence": 0.995 + }, + { + "text": "inédit", + "start": 51.12, + "end": 51.78, + "confidence": 0.995 + }, + { + "text": "induit", + "start": 51.78, + "end": 52.32, + "confidence": 0.955 + }, + { + "text": "que", + "start": 52.32, + "end": 52.42, + "confidence": 0.984 + }, + { + "text": "notre", + "start": 52.42, + "end": 52.78, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 52.78, + "end": 53.28, + "confidence": 0.997 + }, + { + "text": "à", + "start": 53.28, + "end": 53.46, + "confidence": 0.978 + }, + { + "text": "lui", + "start": 53.46, + "end": 53.68, + "confidence": 0.999 + }, + { + "text": "est", + "start": 53.68, + "end": 54.14, + "confidence": 0.907 + }, + { + "text": "aussi", + "start": 54.14, + "end": 54.52, + "confidence": 0.996 + }, + { + "text": "un", + "start": 54.52, + "end": 54.72, + 
"confidence": 0.994 + }, + { + "text": "rapport", + "start": 54.72, + "end": 55.0, + "confidence": 0.997 + }, + { + "text": "inédit ?", + "start": 55.0, + "end": 55.5, + "confidence": 0.996 + } + ] + }, + { + "id": 12, + "seek": 4884, + "start": 55.76, + "end": 63.4, + "text": " Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone ?", + "tokens": [ + 50689, + 2588, + 16389, + 1264, + 11, + 871, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 13307, + 871, + 25323, + 1531, + 22829, + 421, + 6, + 266, + 3962, + 1147, + 1001, + 1531, + 274, + 6, + 16752, + 1111, + 25349, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506, + 51089 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.96, + "words": [ + { + "text": "Je", + "start": 55.76, + "end": 55.9, + "confidence": 0.904 + }, + { + "text": "veux", + "start": 55.9, + "end": 56.0, + "confidence": 0.989 + }, + { + "text": "dire,", + "start": 56.0, + "end": 56.12, + "confidence": 0.997 + }, + { + "text": "est-ce", + "start": 56.22, + "end": 56.38, + "confidence": 0.99 + }, + { + "text": "que", + "start": 56.38, + "end": 56.5, + "confidence": 0.991 + }, + { + "text": "le", + "start": 56.5, + "end": 56.66, + "confidence": 0.996 + }, + { + "text": "rapport", + "start": 56.66, + "end": 56.86, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 56.86, + "end": 57.08, + "confidence": 0.985 + }, + { + "text": "a", + "start": 57.08, + "end": 57.16, + "confidence": 0.99 + }, + { + "text": "au", + "start": 57.16, + "end": 57.28, + "confidence": 0.966 + }, + { + "text": "smartphone", + "start": 57.28, + "end": 57.6, + "confidence": 0.995 + }, + { + "text": "est", + "start": 57.6, + "end": 57.86, + "confidence": 0.91 + }, + { + "text": "comparable", + "start": 57.86, + 
"end": 58.3, + "confidence": 0.996 + }, + { + "text": "à", + "start": 58.3, + "end": 58.5, + "confidence": 0.946 + }, + { + "text": "celui", + "start": 58.5, + "end": 58.66, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 58.66, + "end": 58.96, + "confidence": 0.989 + }, + { + "text": "entretenait", + "start": 58.96, + "end": 59.36, + "confidence": 0.926 + }, + { + "text": "à", + "start": 59.36, + "end": 59.48, + "confidence": 0.951 + }, + { + "text": "d'autres", + "start": 59.48, + "end": 59.7, + "confidence": 0.997 + }, + { + "text": "objets", + "start": 59.7, + "end": 59.98, + "confidence": 0.99 + }, + { + "text": "techniques", + "start": 59.98, + "end": 60.44, + "confidence": 0.984 + }, + { + "text": "comme", + "start": 60.44, + "end": 60.96, + "confidence": 0.496 + }, + { + "text": "la", + "start": 60.96, + "end": 61.52, + "confidence": 0.987 + }, + { + "text": "voiture", + "start": 61.52, + "end": 62.08, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 62.08, + "end": 62.52, + "confidence": 0.95 + }, + { + "text": "le", + "start": 62.52, + "end": 62.74, + "confidence": 0.998 + }, + { + "text": "téléphone ?", + "start": 62.74, + "end": 63.4, + "confidence": 0.999 + } + ] + }, + { + "id": 13, + "seek": 4884, + "start": 65.36, + "end": 66.62, + "text": " Il n'y a pas d'équivalent en fait.", + "tokens": [ + 51189, + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 465, + 3887, + 13, + 51239 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.94, + "words": [ + { + "text": "Il", + "start": 65.36, + "end": 65.5, + "confidence": 0.849 + }, + { + "text": "n'y", + "start": 65.5, + "end": 65.54, + "confidence": 0.979 + }, + { + "text": "a", + "start": 65.54, + "end": 65.56, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 65.56, + "end": 65.66, + "confidence": 0.999 + }, + { + "text": 
"d'équivalent", + "start": 65.66, + "end": 66.3, + "confidence": 0.995 + }, + { + "text": "en", + "start": 66.3, + "end": 66.44, + "confidence": 0.582 + }, + { + "text": "fait.", + "start": 66.44, + "end": 66.62, + "confidence": 0.997 + } + ] + }, + { + "id": 14, + "seek": 4884, + "start": 66.88, + "end": 71.24, + "text": " Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant.", + "tokens": [ + 51239, + 3790, + 5926, + 5550, + 7089, + 30236, + 368, + 11456, + 1375, + 526, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 11, + 269, + 6, + 377, + 7184, + 259, + 394, + 1030, + 7245, + 351, + 5798, + 13, + 51489 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.957, + "words": [ + { + "text": "Et", + "start": 66.88, + "end": 67.02, + "confidence": 0.654 + }, + { + "text": "donc", + "start": 67.02, + "end": 67.12, + "confidence": 0.901 + }, + { + "text": "cette", + "start": 67.12, + "end": 67.3, + "confidence": 0.713 + }, + { + "text": "espèce", + "start": 67.3, + "end": 67.54, + "confidence": 0.996 + }, + { + "text": "de", + "start": 67.54, + "end": 67.76, + "confidence": 0.999 + }, + { + "text": "nouveauté", + "start": 67.76, + "end": 68.48, + "confidence": 0.98 + }, + { + "text": "dans", + "start": 68.48, + "end": 68.84, + "confidence": 0.982 + }, + { + "text": "la", + "start": 68.84, + "end": 68.96, + "confidence": 0.995 + }, + { + "text": "relation", + "start": 68.96, + "end": 69.24, + "confidence": 0.998 + }, + { + "text": "à", + "start": 69.24, + "end": 69.38, + "confidence": 0.997 + }, + { + "text": "l'objet,", + "start": 69.38, + "end": 70.0, + "confidence": 0.998 + }, + { + "text": "c'est", + "start": 70.28, + "end": 70.38, + "confidence": 0.977 + }, + { + "text": "fascinant", + "start": 70.38, + "end": 70.68, + "confidence": 0.98 + }, + { + "text": "et", + "start": 70.68, + "end": 70.76, + 
"confidence": 0.973 + }, + { + "text": "terrifiant.", + "start": 70.76, + "end": 71.24, + "confidence": 0.977 + } + ] + }, + { + "id": 15, + "seek": 7134, + "start": 71.62, + "end": 76.42, + "text": " Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendant de cet objet,", + "tokens": [ + 50389, + 20429, + 421, + 6, + 266, + 257, + 287, + 6, + 36107, + 11, + 5173, + 476, + 37313, + 1512, + 33643, + 25929, + 1030, + 1512, + 3328, + 11, + 274, + 6, + 9498, + 45768, + 394, + 368, + 8603, + 14964, + 11, + 50639 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.862, + "words": [ + { + "text": "Parce", + "start": 71.62, + "end": 71.9, + "confidence": 0.843 + }, + { + "text": "qu'on", + "start": 71.9, + "end": 72.4, + "confidence": 0.968 + }, + { + "text": "a", + "start": 72.4, + "end": 72.54, + "confidence": 0.979 + }, + { + "text": "l'impression,", + "start": 72.54, + "end": 72.9, + "confidence": 0.997 + }, + { + "text": "comme", + "start": 73.66, + "end": 73.9, + "confidence": 0.982 + }, + { + "text": "le", + "start": 73.9, + "end": 74.02, + "confidence": 0.984 + }, + { + "text": "disent", + "start": 74.02, + "end": 74.22, + "confidence": 0.997 + }, + { + "text": "les", + "start": 74.22, + "end": 74.52, + "confidence": 0.996 + }, + { + "text": "utilisateurs", + "start": 74.52, + "end": 74.84, + "confidence": 0.998 + }, + { + "text": "et", + "start": 74.84, + "end": 74.94, + "confidence": 0.845 + }, + { + "text": "les", + "start": 74.94, + "end": 75.02, + "confidence": 0.783 + }, + { + "text": "services,", + "start": 75.02, + "end": 75.18, + "confidence": 0.129 + }, + { + "text": "d'être", + "start": 75.22, + "end": 75.5, + "confidence": 0.935 + }, + { + "text": "dépendant", + "start": 75.5, + "end": 75.98, + "confidence": 0.709 + }, + { + "text": "de", + "start": 75.98, + "end": 76.08, + "confidence": 0.977 + }, + 
{ + "text": "cet", + "start": 76.08, + "end": 76.26, + "confidence": 0.998 + }, + { + "text": "objet,", + "start": 76.26, + "end": 76.42, + "confidence": 0.997 + } + ] + }, + { + "id": 16, + "seek": 7134, + "start": 76.42, + "end": 83.3, + "text": " d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet.", + "tokens": [ + 50639, + 274, + 6, + 471, + 43612, + 465, + 3887, + 2251, + 7089, + 30236, + 368, + 9721, + 11, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 368, + 287, + 6, + 335, + 781, + 374, + 1030, + 1956, + 669, + 18832, + 6212, + 1531, + 730, + 1254, + 279, + 368, + 319, + 7108, + 13, + 50989 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.923, + "words": [ + { + "text": "d'induire", + "start": 76.42, + "end": 77.1, + "confidence": 0.964 + }, + { + "text": "en", + "start": 77.1, + "end": 77.18, + "confidence": 0.72 + }, + { + "text": "fait", + "start": 77.18, + "end": 77.34, + "confidence": 0.997 + }, + { + "text": "une", + "start": 77.34, + "end": 77.5, + "confidence": 0.979 + }, + { + "text": "espèce", + "start": 77.5, + "end": 77.88, + "confidence": 0.997 + }, + { + "text": "de", + "start": 77.88, + "end": 78.28, + "confidence": 0.997 + }, + { + "text": "relation,", + "start": 78.28, + "end": 78.54, + "confidence": 0.422 + }, + { + "text": "de", + "start": 78.66, + "end": 78.96, + "confidence": 0.992 + }, + { + "text": "médiation", + "start": 78.96, + "end": 79.52, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 79.52, + "end": 79.76, + "confidence": 0.954 + }, + { + "text": "le", + "start": 79.76, + "end": 80.02, + "confidence": 0.998 + }, + { + "text": "monde", + "start": 80.02, + "end": 80.3, + "confidence": 0.996 + }, + { + "text": "qui", + "start": 80.3, + "end": 81.24, + "confidence": 0.661 + }, + { + "text": "rend", + 
"start": 81.24, + "end": 81.66, + "confidence": 0.968 + }, + { + "text": "de", + "start": 81.66, + "end": 81.74, + "confidence": 0.688 + }, + { + "text": "l'ampleur", + "start": 81.74, + "end": 82.02, + "confidence": 0.995 + }, + { + "text": "et", + "start": 82.02, + "end": 82.1, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 82.1, + "end": 82.2, + "confidence": 0.987 + }, + { + "text": "amène", + "start": 82.2, + "end": 82.38, + "confidence": 0.971 + }, + { + "text": "aussi", + "start": 82.38, + "end": 82.54, + "confidence": 0.946 + }, + { + "text": "à", + "start": 82.54, + "end": 82.62, + "confidence": 0.959 + }, + { + "text": "des", + "start": 82.62, + "end": 82.7, + "confidence": 0.992 + }, + { + "text": "formes", + "start": 82.7, + "end": 82.88, + "confidence": 0.995 + }, + { + "text": "de", + "start": 82.88, + "end": 83.04, + "confidence": 0.998 + }, + { + "text": "rejet.", + "start": 83.04, + "end": 83.3, + "confidence": 0.802 + } + ] + }, + { + "id": 17, + "seek": 7134, + "start": 83.92, + "end": 87.7, + "text": " Donc à objet inédit, rapport inédit.", + "tokens": [ + 50989, + 7477, + 1531, + 14964, + 294, + 7811, + 270, + 11, + 18018, + 294, + 7811, + 270, + 13, + 51189 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.901, + "words": [ + { + "text": "Donc", + "start": 83.92, + "end": 84.46, + "confidence": 0.984 + }, + { + "text": "à", + "start": 84.46, + "end": 84.98, + "confidence": 0.483 + }, + { + "text": "objet", + "start": 84.98, + "end": 85.46, + "confidence": 0.77 + }, + { + "text": "inédit,", + "start": 85.46, + "end": 86.2, + "confidence": 0.994 + }, + { + "text": "rapport", + "start": 86.54, + "end": 86.9, + "confidence": 0.986 + }, + { + "text": "inédit.", + "start": 86.9, + "end": 87.7, + "confidence": 0.998 + } + ] + }, + { + "id": 18, + "seek": 7134, + "start": 88.02, + "end": 94.92, + "text": " Et ce rapport, 
si j'en crois à Nicolas, serait caractérisé par un mélange de dépendance et de rejet.", + "tokens": [ + 51189, + 3790, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 21724, + 1531, + 38268, + 11, + 23139, + 1032, + 578, + 4198, + 22118, + 971, + 517, + 41953, + 933, + 368, + 45768, + 719, + 1030, + 368, + 319, + 7108, + 13, + 51539 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.975, + "words": [ + { + "text": "Et", + "start": 88.02, + "end": 88.62, + "confidence": 0.989 + }, + { + "text": "ce", + "start": 88.62, + "end": 88.9, + "confidence": 0.985 + }, + { + "text": "rapport,", + "start": 88.9, + "end": 89.32, + "confidence": 0.998 + }, + { + "text": "si", + "start": 89.38, + "end": 89.56, + "confidence": 0.999 + }, + { + "text": "j'en", + "start": 89.56, + "end": 89.78, + "confidence": 0.997 + }, + { + "text": "crois", + "start": 89.78, + "end": 89.88, + "confidence": 0.988 + }, + { + "text": "à", + "start": 89.88, + "end": 90.06, + "confidence": 0.724 + }, + { + "text": "Nicolas,", + "start": 90.06, + "end": 90.24, + "confidence": 0.997 + }, + { + "text": "serait", + "start": 90.7, + "end": 91.0, + "confidence": 0.904 + }, + { + "text": "caractérisé", + "start": 91.0, + "end": 91.8, + "confidence": 0.994 + }, + { + "text": "par", + "start": 91.8, + "end": 92.22, + "confidence": 0.995 + }, + { + "text": "un", + "start": 92.22, + "end": 92.52, + "confidence": 0.996 + }, + { + "text": "mélange", + "start": 92.52, + "end": 93.04, + "confidence": 0.999 + }, + { + "text": "de", + "start": 93.04, + "end": 93.46, + "confidence": 0.998 + }, + { + "text": "dépendance", + "start": 93.46, + "end": 94.12, + "confidence": 0.938 + }, + { + "text": "et", + "start": 94.12, + "end": 94.54, + "confidence": 0.998 + }, + { + "text": "de", + "start": 94.54, + "end": 94.72, + "confidence": 0.999 + }, + { + "text": "rejet.", + "start": 94.72, + "end": 94.92, + 
"confidence": 0.988 + } + ] + }, + { + "id": 19, + "seek": 9484, + "start": 95.74, + "end": 102.82, + "text": " Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies", + "tokens": [ + 50389, + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 5732, + 962, + 1712, + 14953, + 287, + 6, + 29093, + 730, + 1111, + 25349, + 7512, + 1030, + 368, + 9580, + 8969, + 313, + 2680, + 3269, + 371, + 530, + 50739 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.932, + "words": [ + { + "text": "Bon,", + "start": 95.74, + "end": 96.0, + "confidence": 0.751 + }, + { + "text": "en", + "start": 96.34, + "end": 96.54, + "confidence": 0.992 + }, + { + "text": "vrai,", + "start": 96.54, + "end": 96.86, + "confidence": 0.991 + }, + { + "text": "il", + "start": 97.06, + "end": 97.18, + "confidence": 0.992 + }, + { + "text": "faudrait", + "start": 97.18, + "end": 97.58, + "confidence": 0.996 + }, + { + "text": "remonter", + "start": 97.58, + "end": 98.06, + "confidence": 0.995 + }, + { + "text": "très", + "start": 98.06, + "end": 98.58, + "confidence": 0.995 + }, + { + "text": "très", + "start": 98.58, + "end": 98.84, + "confidence": 0.757 + }, + { + "text": "finement", + "start": 98.84, + "end": 99.38, + "confidence": 0.823 + }, + { + "text": "toute", + "start": 99.38, + "end": 99.7, + "confidence": 0.937 + }, + { + "text": "l'histoire", + "start": 99.7, + "end": 100.08, + "confidence": 0.996 + }, + { + "text": "des", + "start": 100.08, + "end": 100.26, + "confidence": 0.991 + }, + { + "text": "objets", + "start": 100.26, + "end": 100.52, + "confidence": 0.998 + }, + { + "text": "techniques", + "start": 100.52, + "end": 100.94, + "confidence": 0.982 + }, + { + "text": "et", + "start": 100.94, + "end": 101.54, + "confidence": 0.512 + }, + { + "text": "de", + "start": 
101.54, + "end": 101.7, + "confidence": 0.984 + }, + { + "text": "leur", + "start": 101.7, + "end": 101.84, + "confidence": 0.818 + }, + { + "text": "insertion", + "start": 101.84, + "end": 102.34, + "confidence": 0.994 + }, + { + "text": "dans", + "start": 102.34, + "end": 102.5, + "confidence": 0.969 + }, + { + "text": "nos", + "start": 102.5, + "end": 102.66, + "confidence": 0.998 + }, + { + "text": "vies", + "start": 102.66, + "end": 102.82, + "confidence": 0.998 + } + ] + }, + { + "id": 20, + "seek": 9484, + "start": 102.86, + "end": 105.72, + "text": " pour déterminer si ce rapport est totalement inédit.", + "tokens": [ + 50739, + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203, + 294, + 7811, + 270, + 13, + 50889 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.995, + "words": [ + { + "text": "pour", + "start": 102.86, + "end": 103.1, + "confidence": 0.989 + }, + { + "text": "déterminer", + "start": 103.1, + "end": 103.64, + "confidence": 0.995 + }, + { + "text": "si", + "start": 103.64, + "end": 103.76, + "confidence": 0.986 + }, + { + "text": "ce", + "start": 103.76, + "end": 103.94, + "confidence": 0.991 + }, + { + "text": "rapport", + "start": 103.94, + "end": 104.26, + "confidence": 0.998 + }, + { + "text": "est", + "start": 104.26, + "end": 104.84, + "confidence": 0.997 + }, + { + "text": "totalement", + "start": 104.84, + "end": 105.3, + "confidence": 0.998 + }, + { + "text": "inédit.", + "start": 105.3, + "end": 105.72, + "confidence": 0.998 + } + ] + }, + { + "id": 21, + "seek": 9484, + "start": 106.14, + "end": 109.32, + "text": " Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment.", + "tokens": [ + 50889, + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 408, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13, + 51089 + ], + "temperature": 0.0, + 
"avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.932, + "words": [ + { + "text": "Mais", + "start": 106.14, + "end": 106.4, + "confidence": 0.975 + }, + { + "text": "j'ai", + "start": 106.4, + "end": 106.92, + "confidence": 0.956 + }, + { + "text": "l'impression", + "start": 106.92, + "end": 107.38, + "confidence": 0.999 + }, + { + "text": "comme", + "start": 107.38, + "end": 107.58, + "confidence": 0.513 + }, + { + "text": "ça", + "start": 107.58, + "end": 107.82, + "confidence": 0.969 + }, + { + "text": "que", + "start": 107.82, + "end": 108.14, + "confidence": 0.973 + }, + { + "text": "Nicolas", + "start": 108.14, + "end": 108.48, + "confidence": 0.983 + }, + { + "text": "ne", + "start": 108.48, + "end": 108.6, + "confidence": 0.72 + }, + { + "text": "se", + "start": 108.6, + "end": 108.72, + "confidence": 0.992 + }, + { + "text": "trompe", + "start": 108.72, + "end": 108.88, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 108.88, + "end": 109.08, + "confidence": 0.999 + }, + { + "text": "vraiment.", + "start": 109.08, + "end": 109.32, + "confidence": 0.989 + } + ] + }, + { + "id": 22, + "seek": 9484, + "start": 109.94, + "end": 115.06, + "text": " Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone.", + "tokens": [ + 51089, + 8732, + 34081, + 631, + 1506, + 262, + 6000, + 11, + 1930, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698, + 1581, + 47159, + 13, + 51389 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.964, + "words": [ + { + "text": "Pour", + "start": 109.94, + "end": 110.1, + "confidence": 0.995 + }, + { + "text": "autant", + "start": 110.1, + "end": 110.24, + "confidence": 1.0 + }, + { + "text": "que", + "start": 110.24, + "end": 110.38, + 
"confidence": 0.984 + }, + { + "text": "je", + "start": 110.38, + "end": 110.52, + "confidence": 0.998 + }, + { + "text": "sache,", + "start": 110.52, + "end": 110.84, + "confidence": 0.952 + }, + { + "text": "il", + "start": 111.08, + "end": 111.16, + "confidence": 0.994 + }, + { + "text": "y", + "start": 111.16, + "end": 111.3, + "confidence": 0.995 + }, + { + "text": "a", + "start": 111.3, + "end": 111.32, + "confidence": 0.993 + }, + { + "text": "eu", + "start": 111.32, + "end": 111.62, + "confidence": 0.998 + }, + { + "text": "plein", + "start": 111.62, + "end": 111.9, + "confidence": 0.966 + }, + { + "text": "de", + "start": 111.9, + "end": 112.14, + "confidence": 0.997 + }, + { + "text": "discussions", + "start": 112.14, + "end": 112.66, + "confidence": 0.83 + }, + { + "text": "autour", + "start": 112.66, + "end": 113.02, + "confidence": 0.995 + }, + { + "text": "de", + "start": 113.02, + "end": 113.38, + "confidence": 0.996 + }, + { + "text": "la", + "start": 113.38, + "end": 113.52, + "confidence": 0.998 + }, + { + "text": "voiture", + "start": 113.52, + "end": 113.88, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 113.88, + "end": 114.06, + "confidence": 0.69 + }, + { + "text": "même", + "start": 114.06, + "end": 114.34, + "confidence": 0.995 + }, + { + "text": "du", + "start": 114.34, + "end": 114.64, + "confidence": 0.992 + }, + { + "text": "téléphone.", + "start": 114.64, + "end": 115.06, + "confidence": 0.999 + } + ] + }, + { + "id": 23, + "seek": 9484, + "start": 115.48, + "end": 117.7, + "text": " Mais la dépendance n'était pas du même ordre.", + "tokens": [ + 51389, + 6313, + 635, + 45768, + 719, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13, + 51489 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.992, + "words": [ + { + "text": "Mais", + "start": 115.48, + "end": 115.78, + "confidence": 0.993 + }, + { + 
"text": "la", + "start": 115.78, + "end": 116.04, + "confidence": 0.943 + }, + { + "text": "dépendance", + "start": 116.04, + "end": 116.42, + "confidence": 0.996 + }, + { + "text": "n'était", + "start": 116.42, + "end": 116.7, + "confidence": 0.994 + }, + { + "text": "pas", + "start": 116.7, + "end": 117.0, + "confidence": 0.998 + }, + { + "text": "du", + "start": 117.0, + "end": 117.2, + "confidence": 0.996 + }, + { + "text": "même", + "start": 117.2, + "end": 117.44, + "confidence": 0.998 + }, + { + "text": "ordre.", + "start": 117.44, + "end": 117.7, + "confidence": 0.999 + } + ] + }, + { + "id": 24, + "seek": 9484, + "start": 117.72, + "end": 119.78, + "text": " Donc le rejet non plus n'était pas du même ordre.", + "tokens": [ + 51489, + 7477, + 476, + 319, + 7108, + 2107, + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13, + 51589 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.979, + "words": [ + { + "text": "Donc", + "start": 117.72, + "end": 118.02, + "confidence": 0.959 + }, + { + "text": "le", + "start": 118.02, + "end": 118.4, + "confidence": 0.819 + }, + { + "text": "rejet", + "start": 118.4, + "end": 118.64, + "confidence": 0.999 + }, + { + "text": "non", + "start": 118.64, + "end": 118.82, + "confidence": 0.982 + }, + { + "text": "plus", + "start": 118.82, + "end": 118.94, + "confidence": 0.994 + }, + { + "text": "n'était", + "start": 118.94, + "end": 119.18, + "confidence": 0.991 + }, + { + "text": "pas", + "start": 119.18, + "end": 119.3, + "confidence": 0.998 + }, + { + "text": "du", + "start": 119.3, + "end": 119.42, + "confidence": 0.995 + }, + { + "text": "même", + "start": 119.42, + "end": 119.58, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 119.58, + "end": 119.78, + "confidence": 0.999 + } + ] + }, + { + "id": 25, + "seek": 9484, + "start": 120.04, + "end": 123.1, + "text": " On peut 
adorer sa bagnole, en avoir besoin pour plein de choses.", + "tokens": [ + 51589, + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 1771, + 306, + 11, + 465, + 10853, + 19207, + 2016, + 21088, + 368, + 14488, + 13, + 51789 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.971, + "words": [ + { + "text": "On", + "start": 120.04, + "end": 120.16, + "confidence": 0.757 + }, + { + "text": "peut", + "start": 120.16, + "end": 120.36, + "confidence": 0.997 + }, + { + "text": "adorer", + "start": 120.36, + "end": 120.68, + "confidence": 0.991 + }, + { + "text": "sa", + "start": 120.68, + "end": 120.88, + "confidence": 0.98 + }, + { + "text": "bagnole,", + "start": 120.88, + "end": 121.34, + "confidence": 0.985 + }, + { + "text": "en", + "start": 121.42, + "end": 121.56, + "confidence": 0.971 + }, + { + "text": "avoir", + "start": 121.56, + "end": 121.8, + "confidence": 0.997 + }, + { + "text": "besoin", + "start": 121.8, + "end": 122.12, + "confidence": 0.999 + }, + { + "text": "pour", + "start": 122.12, + "end": 122.46, + "confidence": 0.989 + }, + { + "text": "plein", + "start": 122.46, + "end": 122.7, + "confidence": 0.987 + }, + { + "text": "de", + "start": 122.7, + "end": 122.78, + "confidence": 0.997 + }, + { + "text": "choses.", + "start": 122.78, + "end": 123.1, + "confidence": 0.99 + } + ] + }, + { + "id": 26, + "seek": 12334, + "start": 123.38, + "end": 126.44, + "text": " Le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 50389, + 1456, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13, + 50539 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.94, + "words": [ + { + "text": "Le", + "start": 123.38, + "end": 123.96, + "confidence": 0.645 + }, + { + "text": "soir,", + 
"start": 123.96, + "end": 124.54, + "confidence": 0.998 + }, + { + "text": "quand", + "start": 124.74, + "end": 124.94, + "confidence": 0.982 + }, + { + "text": "on", + "start": 124.94, + "end": 125.06, + "confidence": 0.996 + }, + { + "text": "va", + "start": 125.06, + "end": 125.16, + "confidence": 0.99 + }, + { + "text": "se", + "start": 125.16, + "end": 125.26, + "confidence": 0.989 + }, + { + "text": "coucher,", + "start": 125.26, + "end": 125.7, + "confidence": 0.989 + }, + { + "text": "on", + "start": 125.94, + "end": 126.04, + "confidence": 0.992 + }, + { + "text": "la", + "start": 126.04, + "end": 126.18, + "confidence": 0.852 + }, + { + "text": "laisse.", + "start": 126.18, + "end": 126.44, + "confidence": 0.999 + } + ] + }, + { + "id": 27, + "seek": 12334, + "start": 127.0, + "end": 130.3, + "text": " On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes.", + "tokens": [ + 50539, + 1282, + 408, + 287, + 6, + 64, + 1736, + 2680, + 635, + 2135, + 6932, + 322, + 871, + 1609, + 7997, + 11, + 322, + 408, + 287, + 6, + 443, + 76, + 18832, + 1736, + 1609, + 13228, + 1521, + 279, + 13, + 50739 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.918, + "words": [ + { + "text": "On", + "start": 127.0, + "end": 127.34, + "confidence": 0.967 + }, + { + "text": "ne", + "start": 127.34, + "end": 127.46, + "confidence": 0.801 + }, + { + "text": "l'a", + "start": 127.46, + "end": 127.56, + "confidence": 0.929 + }, + { + "text": "pas", + "start": 127.56, + "end": 127.68, + "confidence": 0.999 + }, + { + "text": "dans", + "start": 127.68, + "end": 127.86, + "confidence": 0.992 + }, + { + "text": "la", + "start": 127.86, + "end": 128.08, + "confidence": 0.996 + }, + { + "text": "main", + "start": 128.08, + "end": 128.26, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 128.26, + "end": 128.48, + "confidence": 0.936 + }, + 
{ + "text": "on", + "start": 128.48, + "end": 128.6, + "confidence": 0.993 + }, + { + "text": "est", + "start": 128.6, + "end": 128.74, + "confidence": 0.992 + }, + { + "text": "au", + "start": 128.74, + "end": 128.94, + "confidence": 0.976 + }, + { + "text": "lit,", + "start": 128.94, + "end": 129.1, + "confidence": 0.999 + }, + { + "text": "on", + "start": 129.16, + "end": 129.28, + "confidence": 0.43 + }, + { + "text": "ne", + "start": 129.28, + "end": 129.3, + "confidence": 0.949 + }, + { + "text": "l'emmène", + "start": 129.3, + "end": 129.58, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 129.58, + "end": 129.7, + "confidence": 0.997 + }, + { + "text": "au", + "start": 129.7, + "end": 129.88, + "confidence": 0.72 + }, + { + "text": "chiottes.", + "start": 129.88, + "end": 130.3, + "confidence": 0.886 + } + ] + }, + { + "id": 28, + "seek": 12334, + "start": 130.84, + "end": 136.88, + "text": " On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain.", + "tokens": [ + 50739, + 1282, + 45913, + 7418, + 45045, + 15797, + 971, + 1872, + 275, + 2851, + 1398, + 1956, + 8073, + 1001, + 635, + 34207, + 368, + 47159, + 17338, + 2251, + 30027, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13, + 51039 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.925, + "words": [ + { + "text": "On", + "start": 130.84, + "end": 131.06, + "confidence": 0.996 + }, + { + "text": "pouvait", + "start": 131.06, + "end": 131.26, + "confidence": 0.989 + }, + { + "text": "être", + "start": 131.26, + "end": 131.58, + "confidence": 0.995 + }, + { + "text": "énervé", + "start": 131.58, + "end": 132.22, + "confidence": 0.896 + }, + { + "text": "par", + "start": 132.22, + "end": 132.46, + "confidence": 0.992 + }, + { + "text": "son", + "start": 132.46, + "end": 132.72, 
+ "confidence": 0.998 + }, + { + "text": "môme", + "start": 132.72, + "end": 133.08, + "confidence": 0.758 + }, + { + "text": "qui", + "start": 133.08, + "end": 133.34, + "confidence": 0.916 + }, + { + "text": "occupait", + "start": 133.34, + "end": 133.74, + "confidence": 0.992 + }, + { + "text": "la", + "start": 133.74, + "end": 133.86, + "confidence": 0.986 + }, + { + "text": "ligne", + "start": 133.86, + "end": 134.06, + "confidence": 0.999 + }, + { + "text": "de", + "start": 134.06, + "end": 134.22, + "confidence": 0.995 + }, + { + "text": "téléphone", + "start": 134.22, + "end": 134.6, + "confidence": 0.992 + }, + { + "text": "pendant", + "start": 134.6, + "end": 134.92, + "confidence": 0.709 + }, + { + "text": "une", + "start": 134.92, + "end": 135.16, + "confidence": 0.78 + }, + { + "text": "heure", + "start": 135.16, + "end": 135.34, + "confidence": 0.995 + }, + { + "text": "chaque", + "start": 135.34, + "end": 135.58, + "confidence": 0.982 + }, + { + "text": "soir", + "start": 135.58, + "end": 135.8, + "confidence": 0.995 + }, + { + "text": "pour", + "start": 135.8, + "end": 135.98, + "confidence": 0.66 + }, + { + "text": "discuter", + "start": 135.98, + "end": 136.3, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 136.3, + "end": 136.5, + "confidence": 0.995 + }, + { + "text": "un", + "start": 136.5, + "end": 136.66, + "confidence": 0.997 + }, + { + "text": "copain.", + "start": 136.66, + "end": 136.88, + "confidence": 0.996 + } + ] + }, + { + "id": 29, + "seek": 12334, + "start": 137.26, + "end": 141.86, + "text": " Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui,", + "tokens": [ + 51039, + 6313, + 2788, + 408, + 725, + 15750, + 35235, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 1769, + 5698, + 275, + 2851, + 1398, + 14023, + 6, + 10556, + 11, + 51289 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 
1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.956, + "words": [ + { + "text": "Mais", + "start": 137.26, + "end": 137.5, + "confidence": 0.989 + }, + { + "text": "ça", + "start": 137.5, + "end": 137.68, + "confidence": 0.928 + }, + { + "text": "ne", + "start": 137.68, + "end": 137.88, + "confidence": 0.999 + }, + { + "text": "ressemblait", + "start": 137.88, + "end": 138.42, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 138.42, + "end": 138.78, + "confidence": 0.994 + }, + { + "text": "à", + "start": 138.78, + "end": 138.9, + "confidence": 0.989 + }, + { + "text": "ce", + "start": 138.9, + "end": 138.98, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 138.98, + "end": 139.12, + "confidence": 0.976 + }, + { + "text": "peut", + "start": 139.12, + "end": 139.48, + "confidence": 0.979 + }, + { + "text": "ressentir", + "start": 139.48, + "end": 140.1, + "confidence": 0.996 + }, + { + "text": "à", + "start": 140.1, + "end": 140.32, + "confidence": 0.575 + }, + { + "text": "voir", + "start": 140.32, + "end": 140.46, + "confidence": 0.728 + }, + { + "text": "ce", + "start": 140.46, + "end": 140.7, + "confidence": 0.985 + }, + { + "text": "même", + "start": 140.7, + "end": 140.94, + "confidence": 0.982 + }, + { + "text": "môme", + "start": 140.94, + "end": 141.28, + "confidence": 0.997 + }, + { + "text": "aujourd'hui,", + "start": 141.28, + "end": 141.86, + "confidence": 0.994 + } + ] + }, + { + "id": 30, + "seek": 12334, + "start": 142.16, + "end": 144.22, + "text": " continuellement avec son smartphone dans la main,", + "tokens": [ + 51289, + 2354, + 285, + 1712, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.961, + "words": [ + { + "text": "continuellement", + "start": 142.16, + "end": 142.94, + "confidence": 0.963 + }, + { + "text": 
"avec", + "start": 142.94, + "end": 143.2, + "confidence": 0.844 + }, + { + "text": "son", + "start": 143.2, + "end": 143.42, + "confidence": 0.994 + }, + { + "text": "smartphone", + "start": 143.42, + "end": 143.76, + "confidence": 0.972 + }, + { + "text": "dans", + "start": 143.76, + "end": 143.92, + "confidence": 0.963 + }, + { + "text": "la", + "start": 143.92, + "end": 144.02, + "confidence": 0.997 + }, + { + "text": "main,", + "start": 144.02, + "end": 144.22, + "confidence": 0.997 + } + ] + }, + { + "id": 31, + "seek": 12334, + "start": 144.34, + "end": 148.8, + "text": " comme si c'était une sorte de pacemaker externe, comme si le lâcher allait entraîner sa mort immédiate.", + "tokens": [ + 51414, + 5173, + 1511, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 15165, + 49523, + 454, + 391, + 716, + 11, + 5173, + 1511, + 476, + 48835, + 6759, + 439, + 1001, + 22284, + 7517, + 1193, + 601, + 6599, + 3397, + 526, + 4504, + 473, + 13, + 51639 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.973, + "words": [ + { + "text": "comme", + "start": 144.34, + "end": 144.56, + "confidence": 0.985 + }, + { + "text": "si", + "start": 144.56, + "end": 144.66, + "confidence": 0.971 + }, + { + "text": "c'était", + "start": 144.66, + "end": 144.86, + "confidence": 0.987 + }, + { + "text": "une", + "start": 144.86, + "end": 144.98, + "confidence": 0.983 + }, + { + "text": "sorte", + "start": 144.98, + "end": 145.14, + "confidence": 0.992 + }, + { + "text": "de", + "start": 145.14, + "end": 145.34, + "confidence": 0.989 + }, + { + "text": "pacemaker", + "start": 145.34, + "end": 145.82, + "confidence": 0.931 + }, + { + "text": "externe,", + "start": 145.82, + "end": 146.4, + "confidence": 0.99 + }, + { + "text": "comme", + "start": 146.44, + "end": 146.6, + "confidence": 0.721 + }, + { + "text": "si", + "start": 146.6, + "end": 146.74, + "confidence": 0.993 + }, 
+ { + "text": "le", + "start": 146.74, + "end": 147.0, + "confidence": 0.996 + }, + { + "text": "lâcher", + "start": 147.0, + "end": 147.36, + "confidence": 0.968 + }, + { + "text": "allait", + "start": 147.36, + "end": 147.58, + "confidence": 0.991 + }, + { + "text": "entraîner", + "start": 147.58, + "end": 147.88, + "confidence": 0.982 + }, + { + "text": "sa", + "start": 147.88, + "end": 148.02, + "confidence": 0.999 + }, + { + "text": "mort", + "start": 148.02, + "end": 148.3, + "confidence": 0.998 + }, + { + "text": "immédiate.", + "start": 148.3, + "end": 148.8, + "confidence": 0.998 + } + ] + }, + { + "id": 32, + "seek": 12334, + "start": 148.94, + "end": 152.02, + "text": " Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi.", + "tokens": [ + 51639, + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 2851, + 1398, + 11, + 2420, + 269, + 6, + 377, + 24724, + 1323, + 712, + 2016, + 4666, + 6212, + 13, + 51839 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.973, + "words": [ + { + "text": "Bon,", + "start": 148.94, + "end": 149.24, + "confidence": 0.804 + }, + { + "text": "je", + "start": 149.26, + "end": 149.34, + "confidence": 0.933 + }, + { + "text": "dis", + "start": 149.34, + "end": 149.46, + "confidence": 0.982 + }, + { + "text": "ça", + "start": 149.46, + "end": 149.64, + "confidence": 0.992 + }, + { + "text": "pour", + "start": 149.64, + "end": 149.78, + "confidence": 0.997 + }, + { + "text": "le", + "start": 149.78, + "end": 149.9, + "confidence": 0.994 + }, + { + "text": "môme,", + "start": 149.9, + "end": 150.1, + "confidence": 0.999 + }, + { + "text": "mais", + "start": 150.32, + "end": 150.5, + "confidence": 0.904 + }, + { + "text": "c'est", + "start": 150.5, + "end": 150.84, + "confidence": 0.979 + }, + { + "text": "évidemment", + "start": 150.84, + "end": 151.18, + "confidence": 0.979 + }, + { + 
"text": "valable", + "start": 151.18, + "end": 151.48, + "confidence": 0.997 + }, + { + "text": "pour", + "start": 151.48, + "end": 151.64, + "confidence": 0.996 + }, + { + "text": "nous", + "start": 151.64, + "end": 151.78, + "confidence": 0.998 + }, + { + "text": "aussi.", + "start": 151.78, + "end": 152.02, + "confidence": 0.997 + } + ] + }, + { + "id": 33, + "seek": 15284, + "start": 153.14, + "end": 154.68, + "text": " Donc, rapport inédit, d'accord.", + "tokens": [ + 50389, + 7477, + 11, + 18018, + 294, + 7811, + 270, + 11, + 274, + 6, + 19947, + 13, + 50489 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.813, + "words": [ + { + "text": "Donc,", + "start": 153.14, + "end": 153.24, + "confidence": 0.232 + }, + { + "text": "rapport", + "start": 153.26, + "end": 153.62, + "confidence": 0.855 + }, + { + "text": "inédit,", + "start": 153.62, + "end": 154.18, + "confidence": 0.992 + }, + { + "text": "d'accord.", + "start": 154.28, + "end": 154.68, + "confidence": 0.997 + } + ] + }, + { + "id": 34, + "seek": 15284, + "start": 155.64, + "end": 158.52, + "text": " Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais ?", + "tokens": [ + 50489, + 6313, + 19934, + 257, + 12, + 83, + 12, + 266, + 287, + 6, + 36107, + 421, + 6, + 266, + 297, + 6, + 268, + 1333, + 4271, + 14540, + 2506, + 50639 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.958, + "words": [ + { + "text": "Mais", + "start": 155.64, + "end": 155.88, + "confidence": 0.991 + }, + { + "text": "pourquoi", + "start": 155.88, + "end": 156.36, + "confidence": 0.992 + }, + { + "text": "a-t-on", + "start": 156.36, + "end": 156.7, + "confidence": 0.95 + }, + { + "text": "l'impression", + "start": 156.7, + "end": 157.06, + "confidence": 0.998 + }, + { + "text": "qu'on", + 
"start": 157.06, + "end": 157.28, + "confidence": 0.99 + }, + { + "text": "n'en", + "start": 157.28, + "end": 157.5, + "confidence": 0.859 + }, + { + "text": "sortira", + "start": 157.5, + "end": 157.86, + "confidence": 0.974 + }, + { + "text": "jamais ?", + "start": 157.86, + "end": 158.52, + "confidence": 0.997 + } + ] + }, + { + "id": 35, + "seek": 15284, + "start": 159.12, + "end": 165.36, + "text": " Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux ?", + "tokens": [ + 50639, + 4410, + 12, + 384, + 421, + 6, + 388, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 8603, + 484, + 388, + 3551, + 303, + 3409, + 2449, + 1030, + 1026, + 14923, + 1925, + 11, + 1030, + 1026, + 14923, + 1925, + 6992, + 631, + 3551, + 303, + 3409, + 2449, + 2506, + 50989 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.959, + "words": [ + { + "text": "Est-ce", + "start": 159.12, + "end": 159.34, + "confidence": 0.987 + }, + { + "text": "qu'il", + "start": 159.34, + "end": 159.46, + "confidence": 0.993 + }, + { + "text": "faut", + "start": 159.46, + "end": 159.64, + "confidence": 0.998 + }, + { + "text": "en", + "start": 159.64, + "end": 159.88, + "confidence": 0.961 + }, + { + "text": "remettre", + "start": 159.88, + "end": 160.14, + "confidence": 0.999 + }, + { + "text": "la", + "start": 160.14, + "end": 160.46, + "confidence": 0.995 + }, + { + "text": "faute", + "start": 160.46, + "end": 160.64, + "confidence": 0.986 + }, + { + "text": "sur", + "start": 160.64, + "end": 161.06, + "confidence": 0.982 + }, + { + "text": "les", + "start": 161.06, + "end": 161.3, + "confidence": 0.991 + }, + { + "text": "gens", + "start": 161.3, + "end": 161.46, + "confidence": 0.998 + }, + { + "text": "qui", + "start": 161.46, + "end": 
161.56, + "confidence": 0.724 + }, + { + "text": "ont", + "start": 161.56, + "end": 161.82, + "confidence": 0.996 + }, + { + "text": "créé", + "start": 161.82, + "end": 162.28, + "confidence": 0.985 + }, + { + "text": "cet", + "start": 162.28, + "end": 162.48, + "confidence": 0.816 + }, + { + "text": "outil", + "start": 162.48, + "end": 162.78, + "confidence": 0.993 + }, + { + "text": "merveilleux", + "start": 162.78, + "end": 163.36, + "confidence": 0.981 + }, + { + "text": "et", + "start": 163.36, + "end": 163.5, + "confidence": 0.983 + }, + { + "text": "diabolique,", + "start": 163.5, + "end": 163.84, + "confidence": 0.991 + }, + { + "text": "et", + "start": 163.86, + "end": 164.0, + "confidence": 0.555 + }, + { + "text": "diabolique", + "start": 164.0, + "end": 164.4, + "confidence": 0.949 + }, + { + "text": "parce", + "start": 164.4, + "end": 164.66, + "confidence": 0.927 + }, + { + "text": "que", + "start": 164.66, + "end": 164.86, + "confidence": 0.979 + }, + { + "text": "merveilleux ?", + "start": 164.86, + "end": 165.36, + "confidence": 0.997 + } + ] + }, + { + "id": 36, + "seek": 15284, + "start": 166.84, + "end": 168.82, + "text": " Les économistes parlent de dépendance du sentier.", + "tokens": [ + 51039, + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 2279, + 811, + 13, + 51139 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.986, + "words": [ + { + "text": "Les", + "start": 166.84, + "end": 167.08, + "confidence": 0.945 + }, + { + "text": "économistes", + "start": 167.08, + "end": 167.46, + "confidence": 0.997 + }, + { + "text": "parlent", + "start": 167.46, + "end": 167.72, + "confidence": 0.993 + }, + { + "text": "de", + "start": 167.72, + "end": 167.88, + "confidence": 0.992 + }, + { + "text": "dépendance", + "start": 167.88, + "end": 168.34, + "confidence": 0.986 + }, + { + "text": "du", + "start": 
168.34, + "end": 168.52, + "confidence": 0.996 + }, + { + "text": "sentier.", + "start": 168.52, + "end": 168.82, + "confidence": 0.983 + } + ] + }, + { + "id": 37, + "seek": 15284, + "start": 168.98, + "end": 177.38, + "text": " C'est l'idée qu'on met sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "tokens": [ + 51139, + 383, + 6, + 377, + 287, + 6, + 34281, + 421, + 6, + 266, + 1131, + 1022, + 517, + 2279, + 811, + 1956, + 257, + 8862, + 4823, + 455, + 2081, + 11, + 12703, + 40005, + 9020, + 518, + 465, + 8368, + 394, + 30677, + 11, + 12703, + 465, + 40763, + 29492, + 730, + 4232, + 279, + 11, + 465, + 40763, + 29492, + 2251, + 6358, + 42379, + 13, + 51589 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.907, + "words": [ + { + "text": "C'est", + "start": 168.98, + "end": 169.2, + "confidence": 0.996 + }, + { + "text": "l'idée", + "start": 169.2, + "end": 169.38, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 169.38, + "end": 169.74, + "confidence": 0.7 + }, + { + "text": "met", + "start": 169.74, + "end": 169.88, + "confidence": 0.648 + }, + { + "text": "sur", + "start": 169.88, + "end": 170.1, + "confidence": 0.995 + }, + { + "text": "un", + "start": 170.1, + "end": 170.52, + "confidence": 0.997 + }, + { + "text": "sentier", + "start": 170.52, + "end": 170.84, + "confidence": 0.991 + }, + { + "text": "qui", + "start": 170.84, + "end": 170.9, + "confidence": 0.955 + }, + { + "text": "a", + "start": 170.9, + "end": 171.0, + "confidence": 0.969 + }, + { + "text": "été", + "start": 171.0, + "end": 171.14, + "confidence": 0.994 + }, + { + "text": "établi,", + "start": 171.14, + "end": 171.5, + "confidence": 0.995 + }, + { + "text": "soit", + "start": 171.76, + "end": 172.1, + "confidence": 0.527 + }, + { + "text": "volontairement", + "start": 
172.1, + "end": 172.7, + "confidence": 0.987 + }, + { + "text": "en", + "start": 172.7, + "end": 172.86, + "confidence": 0.927 + }, + { + "text": "marchant", + "start": 172.86, + "end": 173.1, + "confidence": 0.997 + }, + { + "text": "dessus,", + "start": 173.1, + "end": 173.48, + "confidence": 0.995 + }, + { + "text": "soit", + "start": 173.86, + "end": 174.28, + "confidence": 0.749 + }, + { + "text": "en", + "start": 174.28, + "end": 175.16, + "confidence": 0.967 + }, + { + "text": "définissant", + "start": 175.16, + "end": 175.54, + "confidence": 0.981 + }, + { + "text": "des", + "start": 175.54, + "end": 175.74, + "confidence": 0.99 + }, + { + "text": "bornes,", + "start": 175.74, + "end": 175.98, + "confidence": 0.977 + }, + { + "text": "en", + "start": 176.04, + "end": 176.14, + "confidence": 0.673 + }, + { + "text": "définissant", + "start": 176.14, + "end": 176.66, + "confidence": 0.996 + }, + { + "text": "une", + "start": 176.66, + "end": 176.94, + "confidence": 0.983 + }, + { + "text": "signalétique.", + "start": 176.94, + "end": 177.38, + "confidence": 0.686 + } + ] + } + ], + "language": "fr", + "language_probs": { + "en": 0.001014346838928759, + "zh": 5.72255376027897e-05, + "de": 9.583473729435354e-05, + "es": 0.00010201553959632292, + "ru": 3.111298428848386e-05, + "ko": 5.633833643514663e-05, + "fr": 0.9971188306808472, + "ja": 0.00011926825391128659, + "pt": 0.00024857642711140215, + "tr": 3.111298428848386e-05, + "pl": 0.00016302037693094462, + "ca": 4.259047159393958e-08, + "nl": 1.5644591258023866e-05, + "ar": 9.288621367886662e-05, + "sv": 2.0521238184301183e-06, + "it": 0.0006971497205086052, + "id": 2.9227943741716444e-05, + "hi": 3.2284438020724338e-06, + "fi": 8.965064921540034e-07, + "vi": 5.546489046537317e-05, + "he": 5.610194193650386e-07, + "uk": 1.0875857014980284e-07, + "el": 4.624531811714405e-06, + "ms": 2.939531441370491e-06, + "cs": 1.2841862826462602e-06, + "ro": 3.4907800454675453e-06, + "da": 7.956947456477792e-08, + "hu": 
5.322803644958185e-06, + "ta": 2.338676807767115e-07, + "no": 1.1047126236007898e-07, + "th": 6.222988304216415e-06, + "ur": 2.0003761846965062e-07, + "hr": 1.4044846174954273e-08, + "bg": 1.846160024854271e-08, + "lt": 2.347129157698191e-09, + "la": 5.8459563661017455e-06, + "mi": 1.850045805440459e-07, + "ml": 6.357183224281471e-07, + "cy": 2.3619797957508126e-06, + "sk": 3.265524739504144e-08, + "te": 2.7931511326073633e-08, + "fa": 1.1577289171782468e-07, + "lv": 2.3058872866688063e-10, + "bn": 5.300469752000936e-08, + "sr": 2.1831703111985235e-10, + "az": 5.115834977864608e-10, + "sl": 3.4222402689465525e-08, + "kn": 2.287942890699668e-10, + "et": 1.0830222274549328e-09, + "mk": 1.6351191234331708e-10, + "br": 5.406625859905034e-06, + "eu": 3.817784843818117e-08, + "is": 9.191490346616149e-10, + "hy": 2.2396462462381805e-09, + "ne": 5.289337856595466e-09, + "mn": 6.634315763420773e-09, + "bs": 3.415052907129734e-09, + "kk": 1.0393448601764277e-10, + "sq": 3.3289374035128105e-10, + "sw": 3.530873726731443e-08, + "gl": 1.509963283297111e-07, + "mr": 1.1710261649255926e-09, + "pa": 1.961099949099321e-09, + "si": 6.805937857734534e-08, + "km": 3.7744330256828107e-06, + "sn": 1.7379569783315674e-07, + "yo": 1.9047636357072406e-08, + "so": 1.3956540784176852e-11, + "af": 7.740010854462298e-10, + "oc": 2.734190331921127e-07, + "ka": 2.9087926511905948e-11, + "be": 2.279703537055866e-08, + "tg": 3.669336102324339e-12, + "sd": 1.1528712429154098e-09, + "gu": 1.3769081708137065e-10, + "am": 8.416871366545564e-11, + "yi": 9.784290044834165e-10, + "lo": 2.809145804860691e-09, + "uz": 5.235589739527313e-12, + "fo": 1.6905737920680508e-09, + "ht": 4.75131045618582e-08, + "ps": 2.007606081377844e-09, + "tk": 2.44944915045453e-11, + "nn": 1.7182223018608056e-05, + "mt": 3.048388971804705e-11, + "sa": 2.338676807767115e-07, + "lb": 6.963176563123952e-12, + "my": 3.0676766016313195e-08, + "bo": 1.2688460948595548e-08, + "tl": 3.4027550555038033e-07, + "mg": 
3.001127818480498e-11, + "as": 2.7169991256847936e-10, + "tt": 5.143594426250397e-13, + "haw": 8.965064921540034e-07, + "ln": 1.041532304846271e-09, + "ha": 8.9408957668069e-12, + "ba": 2.775589653947197e-11, + "jw": 2.3991756279428955e-06, + "su": 2.425283281495827e-12 + } +} \ No newline at end of file diff --git a/tests/expected/medium_fr.cpu/radio_short.mp3.words.json b/tests/expected/medium_fr.cpu/radio_short.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..55a81cf3b19c05b84cbe3d2f0fc3db1d81a0f42e --- /dev/null +++ b/tests/expected/medium_fr.cpu/radio_short.mp3.words.json @@ -0,0 +1,1977 @@ +{ + "text": " Le plus important au poker ce ne sont pas les cartes, c'est ce que vous en faites. Winamax, la référence du poker en ligne. Bonsoir à toutes et tous, vous êtes sur BFM TV, nous sommes en direct, c'est bien sûr BFM story avec tout ce qui fait l'actualité. Durant 60 minutes ce sont des gros plans, des analyses, des réactions que nous vous proposons. Comment Eric Verth peut-il encore soutenir la réforme des retraites alors qu'il est englué dans sa propre affaire, l'affaire Verth-Bettancourt? Question posée par les leaders de la CFDT et la CGT. Réponse de Nicolas Sarkozy, Eric Verth portera le débat sur les retraites, on en parle dans BFM story avec le numéro de la CFDT. Et puis il y a une bataille qui a démarré, celle entre Marine Le Pen et Bruno Gognich, la bataille de la succession de Jean-Marie Le Pen à la tête du Front National. La tournée de campagne de Marine Le Pen commence aujourd'hui dans le Var, Marine Le Pen sera en direct dans BFM story. Restez avec nous Marine Le Pen dans moins de 3 minutes, à tout de suite. Musique L'actualité c'est aussi aujourd'hui un dernier adieu, dernier adieu à Laurent Fignon, c'était au cimetière du Père Lachaise à Paris. 
L'ancien double vainqueur du Tour de France, vaincu par le cancer à 50 ans, a été incinéré en petit comité aujourd'hui.", + "segments": [ + { + "id": 0, + "seek": 3000, + "start": 30.86, + "end": 34.26, + "text": " Le plus important au poker ce ne sont pas les cartes, c'est ce que vous en faites.", + "tokens": [ + 1456, + 1804, + 1021, + 1609, + 36863, + 1769, + 408, + 4900, + 1736, + 1512, + 5467, + 279, + 11, + 269, + 6, + 377, + 1769, + 631, + 2630, + 465, + 29902, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.1935427300283842, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5593915581703186, + "confidence": 0.92, + "words": [ + { + "text": "Le", + "start": 30.86, + "end": 31.02, + "confidence": 0.535 + }, + { + "text": "plus", + "start": 31.02, + "end": 31.12, + "confidence": 0.99 + }, + { + "text": "important", + "start": 31.12, + "end": 31.48, + "confidence": 0.993 + }, + { + "text": "au", + "start": 31.48, + "end": 31.64, + "confidence": 0.946 + }, + { + "text": "poker", + "start": 31.64, + "end": 31.84, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 31.84, + "end": 32.02, + "confidence": 0.581 + }, + { + "text": "ne", + "start": 32.02, + "end": 32.06, + "confidence": 0.961 + }, + { + "text": "sont", + "start": 32.06, + "end": 32.16, + "confidence": 0.991 + }, + { + "text": "pas", + "start": 32.16, + "end": 32.28, + "confidence": 0.991 + }, + { + "text": "les", + "start": 32.28, + "end": 32.42, + "confidence": 0.969 + }, + { + "text": "cartes,", + "start": 32.42, + "end": 33.56, + "confidence": 0.996 + }, + { + "text": "c'est", + "start": 33.56, + "end": 33.62, + "confidence": 0.95 + }, + { + "text": "ce", + "start": 33.62, + "end": 33.66, + "confidence": 0.99 + }, + { + "text": "que", + "start": 33.66, + "end": 33.7, + "confidence": 0.991 + }, + { + "text": "vous", + "start": 33.7, + "end": 33.86, + "confidence": 0.991 + }, + { + "text": "en", + "start": 33.86, + "end": 34.04, + "confidence": 0.982 + }, + { + "text": 
"faites.", + "start": 34.04, + "end": 34.26, + "confidence": 0.894 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 36.18, + "end": 38.76, + "text": " Winamax, la référence du poker en ligne.", + "tokens": [ + 10427, + 2404, + 87, + 11, + 635, + 30170, + 41635, + 1581, + 36863, + 465, + 34207, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.1935427300283842, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5593915581703186, + "confidence": 0.967, + "words": [ + { + "text": "Winamax,", + "start": 36.18, + "end": 37.28, + "confidence": 0.905 + }, + { + "text": "la", + "start": 37.28, + "end": 37.32, + "confidence": 0.988 + }, + { + "text": "référence", + "start": 37.32, + "end": 37.78, + "confidence": 0.998 + }, + { + "text": "du", + "start": 37.78, + "end": 37.96, + "confidence": 0.992 + }, + { + "text": "poker", + "start": 37.96, + "end": 38.22, + "confidence": 0.998 + }, + { + "text": "en", + "start": 38.22, + "end": 38.4, + "confidence": 0.993 + }, + { + "text": "ligne.", + "start": 38.4, + "end": 38.76, + "confidence": 0.993 + } + ] + }, + { + "id": 2, + "seek": 3000, + "start": 44.94, + "end": 51.38, + "text": " Bonsoir à toutes et tous, vous êtes sur BFM TV, nous sommes en direct, c'est bien sûr BFM story avec tout ce qui fait l'actualité.", + "tokens": [ + 7368, + 539, + 347, + 1531, + 14437, + 1030, + 8317, + 11, + 2630, + 18935, + 1022, + 363, + 37, + 44, + 3558, + 11, + 4666, + 25232, + 465, + 2047, + 11, + 269, + 6, + 377, + 3610, + 18143, + 363, + 37, + 44, + 1657, + 4163, + 3486, + 1769, + 1956, + 3887, + 287, + 6, + 578, + 901, + 5066, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.1935427300283842, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5593915581703186, + "confidence": 0.907, + "words": [ + { + "text": "Bonsoir", + "start": 44.94, + "end": 45.4, + "confidence": 0.955 + }, + { + "text": "à", + "start": 45.4, + "end": 45.84, + "confidence": 0.54 + }, + { + "text": "toutes", + "start": 45.84, + 
"end": 46.06, + "confidence": 0.917 + }, + { + "text": "et", + "start": 46.06, + "end": 46.14, + "confidence": 0.988 + }, + { + "text": "tous,", + "start": 46.14, + "end": 46.7, + "confidence": 0.981 + }, + { + "text": "vous", + "start": 46.7, + "end": 46.74, + "confidence": 0.97 + }, + { + "text": "êtes", + "start": 46.74, + "end": 46.9, + "confidence": 0.995 + }, + { + "text": "sur", + "start": 46.9, + "end": 47.04, + "confidence": 0.989 + }, + { + "text": "BFM", + "start": 47.04, + "end": 47.56, + "confidence": 0.987 + }, + { + "text": "TV,", + "start": 47.56, + "end": 47.88, + "confidence": 0.853 + }, + { + "text": "nous", + "start": 47.88, + "end": 47.92, + "confidence": 0.829 + }, + { + "text": "sommes", + "start": 47.92, + "end": 48.14, + "confidence": 0.988 + }, + { + "text": "en", + "start": 48.14, + "end": 48.2, + "confidence": 0.986 + }, + { + "text": "direct,", + "start": 48.2, + "end": 48.74, + "confidence": 0.998 + }, + { + "text": "c'est", + "start": 48.74, + "end": 48.8, + "confidence": 0.939 + }, + { + "text": "bien", + "start": 48.8, + "end": 48.94, + "confidence": 0.971 + }, + { + "text": "sûr", + "start": 48.94, + "end": 49.2, + "confidence": 0.906 + }, + { + "text": "BFM", + "start": 49.2, + "end": 49.84, + "confidence": 0.95 + }, + { + "text": "story", + "start": 49.84, + "end": 50.04, + "confidence": 0.356 + }, + { + "text": "avec", + "start": 50.04, + "end": 50.24, + "confidence": 0.553 + }, + { + "text": "tout", + "start": 50.24, + "end": 50.42, + "confidence": 0.93 + }, + { + "text": "ce", + "start": 50.42, + "end": 50.46, + "confidence": 0.995 + }, + { + "text": "qui", + "start": 50.46, + "end": 50.56, + "confidence": 0.952 + }, + { + "text": "fait", + "start": 50.56, + "end": 50.72, + "confidence": 0.961 + }, + { + "text": "l'actualité.", + "start": 50.72, + "end": 51.38, + "confidence": 0.994 + } + ] + }, + { + "id": 3, + "seek": 3000, + "start": 51.5, + "end": 56.11, + "text": " Durant 60 minutes ce sont des gros plans, des analyses, 
des réactions que nous vous proposons.", + "tokens": [ + 13710, + 394, + 4060, + 2077, + 1769, + 4900, + 730, + 18638, + 5482, + 11, + 730, + 37560, + 11, + 730, + 3960, + 12299, + 631, + 4666, + 2630, + 7532, + 892, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.1935427300283842, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5593915581703186, + "confidence": 0.947, + "words": [ + { + "text": "Durant", + "start": 51.5, + "end": 52.3, + "confidence": 0.935 + }, + { + "text": "60", + "start": 52.3, + "end": 52.7, + "confidence": 0.922 + }, + { + "text": "minutes", + "start": 52.7, + "end": 53.08, + "confidence": 0.912 + }, + { + "text": "ce", + "start": 53.08, + "end": 53.26, + "confidence": 0.752 + }, + { + "text": "sont", + "start": 53.26, + "end": 53.58, + "confidence": 0.979 + }, + { + "text": "des", + "start": 53.58, + "end": 53.86, + "confidence": 0.99 + }, + { + "text": "gros", + "start": 53.86, + "end": 54.02, + "confidence": 0.969 + }, + { + "text": "plans,", + "start": 54.02, + "end": 54.32, + "confidence": 0.958 + }, + { + "text": "des", + "start": 54.32, + "end": 54.44, + "confidence": 0.986 + }, + { + "text": "analyses,", + "start": 54.44, + "end": 54.78, + "confidence": 0.913 + }, + { + "text": "des", + "start": 54.78, + "end": 54.86, + "confidence": 0.995 + }, + { + "text": "réactions", + "start": 54.86, + "end": 55.22, + "confidence": 0.996 + }, + { + "text": "que", + "start": 55.22, + "end": 55.4, + "confidence": 0.882 + }, + { + "text": "nous", + "start": 55.4, + "end": 55.54, + "confidence": 0.947 + }, + { + "text": "vous", + "start": 55.54, + "end": 55.64, + "confidence": 0.99 + }, + { + "text": "proposons.", + "start": 55.64, + "end": 56.11, + "confidence": 0.991 + } + ] + }, + { + "id": 4, + "seek": 5600, + "start": 56.11, + "end": 63.98, + "text": " Comment Eric Verth peut-il encore soutenir la réforme des retraites alors qu'il est englué dans sa propre affaire, l'affaire Verth-Bettancourt?", + "tokens": [ + 16328, + 
9336, + 4281, + 392, + 5977, + 12, + 388, + 10122, + 29350, + 268, + 347, + 635, + 3960, + 44562, + 730, + 49356, + 3324, + 11246, + 421, + 6, + 388, + 871, + 1741, + 2781, + 526, + 2680, + 601, + 35221, + 2096, + 9020, + 11, + 287, + 6, + 2518, + 9020, + 4281, + 392, + 12, + 33, + 3093, + 4463, + 33403, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.12757631117297757, + "compression_ratio": 1.5705329153605017, + "no_speech_prob": 6.333013880066574e-05, + "confidence": 0.858, + "words": [ + { + "text": "Comment", + "start": 56.11, + "end": 56.94, + "confidence": 0.966 + }, + { + "text": "Eric", + "start": 56.94, + "end": 57.2, + "confidence": 0.888 + }, + { + "text": "Verth", + "start": 57.2, + "end": 57.36, + "confidence": 0.376 + }, + { + "text": "peut-il", + "start": 57.36, + "end": 57.8, + "confidence": 0.951 + }, + { + "text": "encore", + "start": 57.8, + "end": 58.36, + "confidence": 0.971 + }, + { + "text": "soutenir", + "start": 58.36, + "end": 58.62, + "confidence": 0.997 + }, + { + "text": "la", + "start": 58.62, + "end": 58.72, + "confidence": 0.98 + }, + { + "text": "réforme", + "start": 58.72, + "end": 59.18, + "confidence": 0.996 + }, + { + "text": "des", + "start": 59.18, + "end": 59.38, + "confidence": 0.994 + }, + { + "text": "retraites", + "start": 59.38, + "end": 59.78, + "confidence": 0.988 + }, + { + "text": "alors", + "start": 59.78, + "end": 59.94, + "confidence": 0.508 + }, + { + "text": "qu'il", + "start": 59.94, + "end": 60.72, + "confidence": 0.965 + }, + { + "text": "est", + "start": 60.72, + "end": 60.86, + "confidence": 0.975 + }, + { + "text": "englué", + "start": 60.86, + "end": 61.74, + "confidence": 0.945 + }, + { + "text": "dans", + "start": 61.74, + "end": 61.92, + "confidence": 0.97 + }, + { + "text": "sa", + "start": 61.92, + "end": 62.42, + "confidence": 0.871 + }, + { + "text": "propre", + "start": 62.42, + "end": 62.74, + "confidence": 0.992 + }, + { + "text": "affaire,", + "start": 62.74, + "end": 62.98, + 
"confidence": 0.993 + }, + { + "text": "l'affaire", + "start": 62.98, + "end": 63.24, + "confidence": 0.903 + }, + { + "text": "Verth-Bettancourt?", + "start": 63.24, + "end": 63.98, + "confidence": 0.714 + } + ] + }, + { + "id": 5, + "seek": 5600, + "start": 64.0, + "end": 67.18, + "text": " Question posée par les leaders de la CFDT et la CGT.", + "tokens": [ + 14464, + 1366, + 3856, + 971, + 1512, + 3523, + 368, + 635, + 21792, + 35, + 51, + 1030, + 635, + 38007, + 51, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.12757631117297757, + "compression_ratio": 1.5705329153605017, + "no_speech_prob": 6.333013880066574e-05, + "confidence": 0.896, + "words": [ + { + "text": "Question", + "start": 64.0, + "end": 64.3, + "confidence": 0.639 + }, + { + "text": "posée", + "start": 64.3, + "end": 64.76, + "confidence": 0.977 + }, + { + "text": "par", + "start": 64.76, + "end": 64.94, + "confidence": 0.989 + }, + { + "text": "les", + "start": 64.94, + "end": 65.08, + "confidence": 0.966 + }, + { + "text": "leaders", + "start": 65.08, + "end": 65.66, + "confidence": 0.977 + }, + { + "text": "de", + "start": 65.66, + "end": 65.9, + "confidence": 0.988 + }, + { + "text": "la", + "start": 65.9, + "end": 66.1, + "confidence": 0.967 + }, + { + "text": "CFDT", + "start": 66.1, + "end": 66.54, + "confidence": 0.994 + }, + { + "text": "et", + "start": 66.54, + "end": 66.62, + "confidence": 0.586 + }, + { + "text": "la", + "start": 66.62, + "end": 66.66, + "confidence": 0.627 + }, + { + "text": "CGT.", + "start": 66.66, + "end": 67.18, + "confidence": 0.987 + } + ] + }, + { + "id": 6, + "seek": 5600, + "start": 67.44, + "end": 76.42, + "text": " Réponse de Nicolas Sarkozy, Eric Verth portera le débat sur les retraites, on en parle dans BFM story avec le numéro de la CFDT.", + "tokens": [ + 41587, + 3739, + 368, + 38268, + 318, + 809, + 78, + 1229, + 11, + 9336, + 4281, + 392, + 1515, + 23833, + 476, + 2795, + 11980, + 1022, + 1512, + 49356, + 3324, + 11, + 322, + 465, + 18508, + 
2680, + 363, + 37, + 44, + 1657, + 4163, + 476, + 49525, + 368, + 635, + 21792, + 35, + 51, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.12757631117297757, + "compression_ratio": 1.5705329153605017, + "no_speech_prob": 6.333013880066574e-05, + "confidence": 0.968, + "words": [ + { + "text": "Réponse", + "start": 67.44, + "end": 67.94, + "confidence": 0.957 + }, + { + "text": "de", + "start": 67.94, + "end": 68.1, + "confidence": 0.966 + }, + { + "text": "Nicolas", + "start": 68.1, + "end": 68.36, + "confidence": 0.934 + }, + { + "text": "Sarkozy,", + "start": 68.36, + "end": 69.06, + "confidence": 0.988 + }, + { + "text": "Eric", + "start": 69.06, + "end": 69.24, + "confidence": 0.962 + }, + { + "text": "Verth", + "start": 69.24, + "end": 69.8, + "confidence": 0.988 + }, + { + "text": "portera", + "start": 69.8, + "end": 70.64, + "confidence": 0.966 + }, + { + "text": "le", + "start": 70.64, + "end": 71.0, + "confidence": 0.99 + }, + { + "text": "débat", + "start": 71.0, + "end": 71.4, + "confidence": 0.996 + }, + { + "text": "sur", + "start": 71.4, + "end": 71.66, + "confidence": 0.99 + }, + { + "text": "les", + "start": 71.66, + "end": 71.82, + "confidence": 0.997 + }, + { + "text": "retraites,", + "start": 71.82, + "end": 72.34, + "confidence": 0.996 + }, + { + "text": "on", + "start": 72.34, + "end": 72.46, + "confidence": 0.842 + }, + { + "text": "en", + "start": 72.46, + "end": 72.74, + "confidence": 0.948 + }, + { + "text": "parle", + "start": 72.74, + "end": 72.92, + "confidence": 0.996 + }, + { + "text": "dans", + "start": 72.92, + "end": 73.42, + "confidence": 0.983 + }, + { + "text": "BFM", + "start": 73.42, + "end": 74.6, + "confidence": 0.992 + }, + { + "text": "story", + "start": 74.6, + "end": 74.7, + "confidence": 0.756 + }, + { + "text": "avec", + "start": 74.7, + "end": 75.08, + "confidence": 0.837 + }, + { + "text": "le", + "start": 75.08, + "end": 75.26, + "confidence": 0.984 + }, + { + "text": "numéro", + "start": 75.26, + "end": 75.52, 
+ "confidence": 0.997 + }, + { + "text": "de", + "start": 75.52, + "end": 75.76, + "confidence": 0.996 + }, + { + "text": "la", + "start": 75.76, + "end": 75.9, + "confidence": 0.99 + }, + { + "text": "CFDT.", + "start": 75.9, + "end": 76.42, + "confidence": 0.998 + } + ] + }, + { + "id": 7, + "seek": 5600, + "start": 76.5, + "end": 83.0, + "text": " Et puis il y a une bataille qui a démarré, celle entre Marine Le Pen et Bruno Gognich, la bataille de la succession de Jean-Marie Le Pen à la tête du Front National.", + "tokens": [ + 3790, + 9093, + 1930, + 288, + 257, + 2251, + 272, + 3274, + 3409, + 1956, + 257, + 22761, + 2284, + 526, + 11, + 25722, + 3962, + 20415, + 1456, + 10571, + 1030, + 23046, + 460, + 2912, + 480, + 11, + 635, + 272, + 3274, + 3409, + 368, + 635, + 36624, + 368, + 13854, + 12, + 16639, + 414, + 1456, + 10571, + 1531, + 635, + 24661, + 1581, + 17348, + 4862, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.12757631117297757, + "compression_ratio": 1.5705329153605017, + "no_speech_prob": 6.333013880066574e-05, + "confidence": 0.872, + "words": [ + { + "text": "Et", + "start": 76.5, + "end": 76.96, + "confidence": 0.912 + }, + { + "text": "puis", + "start": 76.96, + "end": 77.08, + "confidence": 0.958 + }, + { + "text": "il", + "start": 77.08, + "end": 77.14, + "confidence": 0.794 + }, + { + "text": "y", + "start": 77.14, + "end": 77.18, + "confidence": 0.994 + }, + { + "text": "a", + "start": 77.18, + "end": 77.22, + "confidence": 0.986 + }, + { + "text": "une", + "start": 77.22, + "end": 77.3, + "confidence": 0.996 + }, + { + "text": "bataille", + "start": 77.3, + "end": 77.56, + "confidence": 0.996 + }, + { + "text": "qui", + "start": 77.56, + "end": 77.68, + "confidence": 0.997 + }, + { + "text": "a", + "start": 77.68, + "end": 77.72, + "confidence": 0.985 + }, + { + "text": "démarré,", + "start": 77.72, + "end": 78.16, + "confidence": 0.987 + }, + { + "text": "celle", + "start": 78.16, + "end": 78.38, + "confidence": 0.997 + }, + { + 
"text": "entre", + "start": 78.38, + "end": 78.64, + "confidence": 0.976 + }, + { + "text": "Marine", + "start": 78.64, + "end": 78.96, + "confidence": 0.987 + }, + { + "text": "Le", + "start": 78.96, + "end": 79.12, + "confidence": 0.986 + }, + { + "text": "Pen", + "start": 79.12, + "end": 79.16, + "confidence": 0.987 + }, + { + "text": "et", + "start": 79.16, + "end": 79.32, + "confidence": 0.997 + }, + { + "text": "Bruno", + "start": 79.32, + "end": 79.54, + "confidence": 0.986 + }, + { + "text": "Gognich,", + "start": 79.54, + "end": 80.2, + "confidence": 0.24 + }, + { + "text": "la", + "start": 80.2, + "end": 80.32, + "confidence": 0.676 + }, + { + "text": "bataille", + "start": 80.32, + "end": 80.54, + "confidence": 0.998 + }, + { + "text": "de", + "start": 80.54, + "end": 80.72, + "confidence": 0.975 + }, + { + "text": "la", + "start": 80.72, + "end": 80.92, + "confidence": 0.988 + }, + { + "text": "succession", + "start": 80.92, + "end": 81.18, + "confidence": 0.983 + }, + { + "text": "de", + "start": 81.18, + "end": 81.44, + "confidence": 0.984 + }, + { + "text": "Jean-Marie", + "start": 81.44, + "end": 81.7, + "confidence": 0.95 + }, + { + "text": "Le", + "start": 81.7, + "end": 81.94, + "confidence": 0.996 + }, + { + "text": "Pen", + "start": 81.94, + "end": 81.98, + "confidence": 0.999 + }, + { + "text": "à", + "start": 81.98, + "end": 82.12, + "confidence": 0.976 + }, + { + "text": "la", + "start": 82.12, + "end": 82.28, + "confidence": 0.995 + }, + { + "text": "tête", + "start": 82.28, + "end": 82.32, + "confidence": 0.926 + }, + { + "text": "du", + "start": 82.32, + "end": 82.48, + "confidence": 0.997 + }, + { + "text": "Front", + "start": 82.48, + "end": 82.64, + "confidence": 0.775 + }, + { + "text": "National.", + "start": 82.64, + "end": 83.0, + "confidence": 0.836 + } + ] + }, + { + "id": 8, + "seek": 8300, + "start": 83.3, + "end": 88.82, + "text": " La tournée de campagne de Marine Le Pen commence aujourd'hui dans le Var, Marine Le Pen sera en 
direct dans BFM story.", + "tokens": [ + 2369, + 3512, + 77, + 3856, + 368, + 2255, + 13887, + 368, + 20415, + 1456, + 10571, + 18137, + 14023, + 6, + 10556, + 2680, + 476, + 14662, + 11, + 20415, + 1456, + 10571, + 15021, + 465, + 2047, + 2680, + 363, + 37, + 44, + 1657, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10741670781915838, + "compression_ratio": 1.3591549295774648, + "no_speech_prob": 0.00011412434105295688, + "confidence": 0.958, + "words": [ + { + "text": "La", + "start": 83.3, + "end": 83.56, + "confidence": 0.98 + }, + { + "text": "tournée", + "start": 83.56, + "end": 84.14, + "confidence": 0.995 + }, + { + "text": "de", + "start": 84.14, + "end": 84.36, + "confidence": 0.947 + }, + { + "text": "campagne", + "start": 84.36, + "end": 84.84, + "confidence": 0.984 + }, + { + "text": "de", + "start": 84.84, + "end": 84.9, + "confidence": 0.977 + }, + { + "text": "Marine", + "start": 84.9, + "end": 85.18, + "confidence": 0.997 + }, + { + "text": "Le", + "start": 85.18, + "end": 85.26, + "confidence": 0.998 + }, + { + "text": "Pen", + "start": 85.26, + "end": 85.44, + "confidence": 0.999 + }, + { + "text": "commence", + "start": 85.44, + "end": 85.78, + "confidence": 0.98 + }, + { + "text": "aujourd'hui", + "start": 85.78, + "end": 86.14, + "confidence": 0.991 + }, + { + "text": "dans", + "start": 86.14, + "end": 86.24, + "confidence": 0.984 + }, + { + "text": "le", + "start": 86.24, + "end": 86.38, + "confidence": 0.913 + }, + { + "text": "Var,", + "start": 86.38, + "end": 86.82, + "confidence": 0.523 + }, + { + "text": "Marine", + "start": 86.82, + "end": 86.96, + "confidence": 0.993 + }, + { + "text": "Le", + "start": 86.96, + "end": 87.04, + "confidence": 0.993 + }, + { + "text": "Pen", + "start": 87.04, + "end": 87.22, + "confidence": 0.999 + }, + { + "text": "sera", + "start": 87.22, + "end": 87.48, + "confidence": 0.991 + }, + { + "text": "en", + "start": 87.48, + "end": 87.68, + "confidence": 0.991 + }, + { + "text": "direct", + "start": 
87.68, + "end": 87.98, + "confidence": 0.997 + }, + { + "text": "dans", + "start": 87.98, + "end": 88.3, + "confidence": 0.935 + }, + { + "text": "BFM", + "start": 88.3, + "end": 88.72, + "confidence": 0.997 + }, + { + "text": "story.", + "start": 88.72, + "end": 88.82, + "confidence": 0.827 + } + ] + }, + { + "id": 9, + "seek": 8300, + "start": 89.0, + "end": 92.15, + "text": " Restez avec nous Marine Le Pen dans moins de 3 minutes, à tout de suite.", + "tokens": [ + 13094, + 4371, + 4163, + 4666, + 20415, + 1456, + 10571, + 2680, + 13099, + 368, + 805, + 2077, + 11, + 1531, + 3486, + 368, + 14205, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10741670781915838, + "compression_ratio": 1.3591549295774648, + "no_speech_prob": 0.00011412434105295688, + "confidence": 0.937, + "words": [ + { + "text": "Restez", + "start": 89.0, + "end": 89.64, + "confidence": 0.966 + }, + { + "text": "avec", + "start": 89.64, + "end": 89.68, + "confidence": 0.997 + }, + { + "text": "nous", + "start": 89.68, + "end": 89.94, + "confidence": 0.968 + }, + { + "text": "Marine", + "start": 89.94, + "end": 90.18, + "confidence": 0.906 + }, + { + "text": "Le", + "start": 90.18, + "end": 90.4, + "confidence": 0.998 + }, + { + "text": "Pen", + "start": 90.4, + "end": 90.68, + "confidence": 0.999 + }, + { + "text": "dans", + "start": 90.68, + "end": 90.88, + "confidence": 0.836 + }, + { + "text": "moins", + "start": 90.88, + "end": 91.18, + "confidence": 0.993 + }, + { + "text": "de", + "start": 91.18, + "end": 91.28, + "confidence": 0.991 + }, + { + "text": "3", + "start": 91.28, + "end": 91.46, + "confidence": 0.609 + }, + { + "text": "minutes,", + "start": 91.46, + "end": 91.86, + "confidence": 0.986 + }, + { + "text": "à", + "start": 91.86, + "end": 91.9, + "confidence": 0.962 + }, + { + "text": "tout", + "start": 91.9, + "end": 92.04, + "confidence": 0.918 + }, + { + "text": "de", + "start": 92.04, + "end": 92.1, + "confidence": 0.999 + }, + { + "text": "suite.", + "start": 92.1, + 
"end": 92.15, + "confidence": 0.999 + } + ] + }, + { + "id": 10, + "seek": 9200, + "start": 92.15, + "end": 93.74, + "text": " Musique", + "tokens": [ + 3569, + 1925 + ], + "temperature": 0.0, + "avg_logprob": -0.15070751414579503, + "compression_ratio": 1.4545454545454546, + "no_speech_prob": 8.21087378426455e-05, + "confidence": 0.328, + "words": [ + { + "text": "Musique", + "start": 92.15, + "end": 93.74, + "confidence": 0.328 + } + ] + }, + { + "id": 11, + "seek": 9200, + "start": 106.7, + "end": 113.5, + "text": " L'actualité c'est aussi aujourd'hui un dernier adieu, dernier adieu à Laurent Fignon, c'était au cimetière du Père Lachaise à Paris.", + "tokens": [ + 441, + 6, + 578, + 901, + 5066, + 269, + 6, + 377, + 6212, + 14023, + 6, + 10556, + 517, + 29332, + 614, + 19347, + 11, + 29332, + 614, + 19347, + 1531, + 49357, + 479, + 41846, + 11, + 269, + 6, + 9743, + 1609, + 269, + 26123, + 10195, + 1581, + 430, + 4212, + 441, + 27442, + 908, + 1531, + 8380, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.15070751414579503, + "compression_ratio": 1.4545454545454546, + "no_speech_prob": 8.21087378426455e-05, + "confidence": 0.898, + "words": [ + { + "text": "L'actualité", + "start": 106.7, + "end": 107.44, + "confidence": 0.868 + }, + { + "text": "c'est", + "start": 107.44, + "end": 107.66, + "confidence": 0.84 + }, + { + "text": "aussi", + "start": 107.66, + "end": 108.02, + "confidence": 0.804 + }, + { + "text": "aujourd'hui", + "start": 108.02, + "end": 108.38, + "confidence": 0.928 + }, + { + "text": "un", + "start": 108.38, + "end": 108.48, + "confidence": 0.887 + }, + { + "text": "dernier", + "start": 108.48, + "end": 108.8, + "confidence": 0.991 + }, + { + "text": "adieu,", + "start": 108.8, + "end": 109.2, + "confidence": 0.982 + }, + { + "text": "dernier", + "start": 109.2, + "end": 109.38, + "confidence": 0.501 + }, + { + "text": "adieu", + "start": 109.38, + "end": 109.96, + "confidence": 0.997 + }, + { + "text": "à", + "start": 109.96, + "end": 
110.12, + "confidence": 0.978 + }, + { + "text": "Laurent", + "start": 110.12, + "end": 110.42, + "confidence": 0.94 + }, + { + "text": "Fignon,", + "start": 110.42, + "end": 111.12, + "confidence": 0.816 + }, + { + "text": "c'était", + "start": 111.12, + "end": 111.24, + "confidence": 0.972 + }, + { + "text": "au", + "start": 111.24, + "end": 111.46, + "confidence": 0.99 + }, + { + "text": "cimetière", + "start": 111.46, + "end": 111.94, + "confidence": 0.984 + }, + { + "text": "du", + "start": 111.94, + "end": 112.14, + "confidence": 0.963 + }, + { + "text": "Père", + "start": 112.14, + "end": 112.36, + "confidence": 0.892 + }, + { + "text": "Lachaise", + "start": 112.36, + "end": 112.88, + "confidence": 0.864 + }, + { + "text": "à", + "start": 112.88, + "end": 113.12, + "confidence": 0.795 + }, + { + "text": "Paris.", + "start": 113.12, + "end": 113.5, + "confidence": 0.998 + } + ] + }, + { + "id": 12, + "seek": 11400, + "start": 114.02, + "end": 120.46, + "text": " L'ancien double vainqueur du Tour de France, vaincu par le cancer à 50 ans, a été incinéré en petit comité aujourd'hui.", + "tokens": [ + 50364, + 441, + 6, + 38840, + 268, + 3834, + 22240, + 1077, + 374, + 1581, + 13077, + 368, + 6190, + 11, + 22240, + 12032, + 971, + 476, + 5592, + 1531, + 2625, + 1567, + 11, + 257, + 8862, + 834, + 259, + 29071, + 465, + 9686, + 395, + 5066, + 14023, + 6, + 10556, + 13, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.10655183541147333, + "compression_ratio": 1.1160714285714286, + "no_speech_prob": 0.0002510416379664093, + "confidence": 0.933, + "words": [ + { + "text": "L'ancien", + "start": 114.02, + "end": 114.36, + "confidence": 0.735 + }, + { + "text": "double", + "start": 114.36, + "end": 114.64, + "confidence": 0.991 + }, + { + "text": "vainqueur", + "start": 114.64, + "end": 115.08, + "confidence": 0.996 + }, + { + "text": "du", + "start": 115.08, + "end": 115.18, + "confidence": 0.971 + }, + { + "text": "Tour", + "start": 115.18, + "end": 115.36, + 
"confidence": 0.828 + }, + { + "text": "de", + "start": 115.36, + "end": 115.5, + "confidence": 0.992 + }, + { + "text": "France,", + "start": 115.5, + "end": 116.32, + "confidence": 0.999 + }, + { + "text": "vaincu", + "start": 116.32, + "end": 116.48, + "confidence": 0.989 + }, + { + "text": "par", + "start": 116.48, + "end": 116.6, + "confidence": 0.997 + }, + { + "text": "le", + "start": 116.6, + "end": 116.74, + "confidence": 0.994 + }, + { + "text": "cancer", + "start": 116.74, + "end": 117.06, + "confidence": 0.966 + }, + { + "text": "à", + "start": 117.06, + "end": 117.24, + "confidence": 0.964 + }, + { + "text": "50", + "start": 117.24, + "end": 117.54, + "confidence": 0.977 + }, + { + "text": "ans,", + "start": 117.54, + "end": 118.34, + "confidence": 0.989 + }, + { + "text": "a", + "start": 118.34, + "end": 118.38, + "confidence": 0.989 + }, + { + "text": "été", + "start": 118.38, + "end": 118.56, + "confidence": 0.996 + }, + { + "text": "incinéré", + "start": 118.56, + "end": 119.24, + "confidence": 0.965 + }, + { + "text": "en", + "start": 119.24, + "end": 119.48, + "confidence": 0.913 + }, + { + "text": "petit", + "start": 119.48, + "end": 119.74, + "confidence": 0.883 + }, + { + "text": "comité", + "start": 119.74, + "end": 120.18, + "confidence": 0.978 + }, + { + "text": "aujourd'hui.", + "start": 120.18, + "end": 120.46, + "confidence": 0.929 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr.cpu/smartphone.mp3.words.json b/tests/expected/medium_fr.cpu/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..9faa961d5cf4a38b6ac04b76010aeaddb28cee89 --- /dev/null +++ b/tests/expected/medium_fr.cpu/smartphone.mp3.words.json @@ -0,0 +1,4802 @@ +{ + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça. 
Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions, mais la manière dont elles interagissent entre elles. Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces. L'écran tactile a été beaucoup très souvent mentionné. Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes. Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible. Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but. Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité. Mais ça, ça soulève une autre interrogation. Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit? Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone? Il n'y a pas d'équivalent en fait. Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant. Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendants de cet objet, d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet. Donc, à objet inédit, rapport inédit. Et ce rapport, si j'en crois Nicolas, serait caractérisé par un mélange de dépendance et de rejet. Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment. 
Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre. On peut adorer sa bagnole, en avoir besoin pour plein de choses. Et bien, le soir, quand on va se coucher, on la laisse. On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes. On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui, continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe, comme si le lâcher allait entraîner sa mort immédiate. Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi. Donc, rapport inédit. D'accord. Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais? Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux? Les économistes parlent de dépendance du sentier. 
C'est l'idée qu'on est sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.38, + "end": 3.62, + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça.", + "tokens": [ + 383, + 6, + 377, + 20090, + 1078, + 1769, + 631, + 6176, + 38268, + 11, + 2420, + 1506, + 408, + 385, + 287, + 6, + 22824, + 14540, + 49990, + 526, + 5173, + 2788, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.935, + "words": [ + { + "text": "C'est", + "start": 0.38, + "end": 0.58, + "confidence": 0.961 + }, + { + "text": "évident", + "start": 0.58, + "end": 0.88, + "confidence": 0.984 + }, + { + "text": "ce", + "start": 0.88, + "end": 1.02, + "confidence": 0.663 + }, + { + "text": "que", + "start": 1.02, + "end": 1.08, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 1.08, + "end": 1.2, + "confidence": 0.994 + }, + { + "text": "Nicolas,", + "start": 1.2, + "end": 1.78, + "confidence": 0.91 + }, + { + "text": "mais", + "start": 1.78, + "end": 1.9, + "confidence": 0.979 + }, + { + "text": "je", + "start": 1.9, + "end": 2.24, + "confidence": 0.982 + }, + { + "text": "ne", + "start": 2.24, + "end": 2.34, + "confidence": 0.835 + }, + { + "text": "me", + "start": 2.34, + "end": 2.38, + "confidence": 0.82 + }, + { + "text": "l'étais", + "start": 2.38, + "end": 2.58, + "confidence": 0.971 + }, + { + "text": "jamais", + "start": 2.58, + "end": 2.84, + "confidence": 0.989 + }, + { + "text": "formulé", + "start": 2.84, + "end": 3.26, + "confidence": 0.909 + }, + { + "text": "comme", + "start": 3.26, + "end": 3.42, + "confidence": 0.993 + }, + { + "text": "ça.", + "start": 3.42, + "end": 3.62, + "confidence": 0.975 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 4.08, + "end": 7.92, + "text": " 
Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions,", + "tokens": [ + 8257, + 1956, + 3887, + 635, + 3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 287, + 6, + 8476, + 449, + 2776, + 730, + 17290, + 3916, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.93, + "words": [ + { + "text": "Ce", + "start": 4.08, + "end": 4.26, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 4.26, + "end": 4.34, + "confidence": 0.958 + }, + { + "text": "fait", + "start": 4.34, + "end": 4.48, + "confidence": 0.565 + }, + { + "text": "la", + "start": 4.48, + "end": 4.66, + "confidence": 0.971 + }, + { + "text": "force", + "start": 4.66, + "end": 5.0, + "confidence": 0.999 + }, + { + "text": "du", + "start": 5.0, + "end": 5.2, + "confidence": 0.996 + }, + { + "text": "smartphone,", + "start": 5.2, + "end": 5.88, + "confidence": 0.911 + }, + { + "text": "c'est", + "start": 5.88, + "end": 6.12, + "confidence": 0.88 + }, + { + "text": "pas", + "start": 6.12, + "end": 6.26, + "confidence": 0.992 + }, + { + "text": "seulement", + "start": 6.26, + "end": 6.52, + "confidence": 0.999 + }, + { + "text": "l'accumulation", + "start": 6.52, + "end": 7.38, + "confidence": 0.958 + }, + { + "text": "des", + "start": 7.38, + "end": 7.56, + "confidence": 0.983 + }, + { + "text": "fonctions,", + "start": 7.56, + "end": 7.92, + "confidence": 0.987 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 8.32, + "end": 10.88, + "text": " mais la manière dont elles interagissent entre elles.", + "tokens": [ + 2420, + 635, + 22267, + 9400, + 23576, + 728, + 559, + 25450, + 3962, + 23576, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.977, + "words": [ + { + "text": "mais", + "start": 8.32, + "end": 8.44, + 
"confidence": 0.992 + }, + { + "text": "la", + "start": 8.44, + "end": 8.6, + "confidence": 0.995 + }, + { + "text": "manière", + "start": 8.6, + "end": 8.9, + "confidence": 0.999 + }, + { + "text": "dont", + "start": 8.9, + "end": 9.1, + "confidence": 0.978 + }, + { + "text": "elles", + "start": 9.1, + "end": 9.48, + "confidence": 0.967 + }, + { + "text": "interagissent", + "start": 9.48, + "end": 10.32, + "confidence": 0.964 + }, + { + "text": "entre", + "start": 10.32, + "end": 10.58, + "confidence": 0.956 + }, + { + "text": "elles.", + "start": 10.58, + "end": 10.88, + "confidence": 0.99 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 10.96, + "end": 13.0, + "text": " Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant.", + "tokens": [ + 8257, + 1956, + 6176, + 274, + 6, + 19400, + 1022, + 635, + 5052, + 11, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.906, + "words": [ + { + "text": "Ce", + "start": 10.96, + "end": 11.16, + "confidence": 0.607 + }, + { + "text": "qui", + "start": 11.16, + "end": 11.22, + "confidence": 0.765 + }, + { + "text": "dit", + "start": 11.22, + "end": 11.4, + "confidence": 0.983 + }, + { + "text": "d'ailleurs", + "start": 11.4, + "end": 11.56, + "confidence": 0.985 + }, + { + "text": "sur", + "start": 11.56, + "end": 11.72, + "confidence": 0.477 + }, + { + "text": "la", + "start": 11.72, + "end": 11.78, + "confidence": 0.984 + }, + { + "text": "photo,", + "start": 11.78, + "end": 12.12, + "confidence": 0.994 + }, + { + "text": "c'est", + "start": 12.12, + "end": 12.2, + "confidence": 0.997 + }, + { + "text": "hyper", + "start": 12.2, + "end": 12.42, + "confidence": 0.993 + }, + { + "text": "convaincant.", + "start": 12.42, + "end": 13.0, + "confidence": 0.982 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.34, + "end": 16.02, + "text": " 
Alors évidemment, il faudrait ajouter les interfaces.", + "tokens": [ + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.913, + "words": [ + { + "text": "Alors", + "start": 13.34, + "end": 13.62, + "confidence": 0.585 + }, + { + "text": "évidemment,", + "start": 13.62, + "end": 14.34, + "confidence": 0.832 + }, + { + "text": "il", + "start": 14.34, + "end": 14.38, + "confidence": 0.952 + }, + { + "text": "faudrait", + "start": 14.38, + "end": 14.74, + "confidence": 0.996 + }, + { + "text": "ajouter", + "start": 14.74, + "end": 15.16, + "confidence": 0.992 + }, + { + "text": "les", + "start": 15.16, + "end": 15.52, + "confidence": 0.985 + }, + { + "text": "interfaces.", + "start": 15.52, + "end": 16.02, + "confidence": 0.984 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 16.22, + "end": 19.36, + "text": " L'écran tactile a été beaucoup très souvent mentionné.", + "tokens": [ + 441, + 6, + 9062, + 4257, + 47319, + 257, + 8862, + 8796, + 5732, + 20847, + 2152, + 15055, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.923, + "words": [ + { + "text": "L'écran", + "start": 16.22, + "end": 16.7, + "confidence": 0.996 + }, + { + "text": "tactile", + "start": 16.7, + "end": 17.06, + "confidence": 0.986 + }, + { + "text": "a", + "start": 17.06, + "end": 17.26, + "confidence": 0.98 + }, + { + "text": "été", + "start": 17.26, + "end": 17.88, + "confidence": 0.975 + }, + { + "text": "beaucoup", + "start": 17.88, + "end": 18.28, + "confidence": 0.976 + }, + { + "text": "très", + "start": 18.28, + "end": 18.62, + "confidence": 0.447 + }, + { + "text": "souvent", + "start": 18.62, + "end": 18.9, + "confidence": 0.996 + }, + { + "text": "mentionné.", + 
"start": 18.9, + "end": 19.36, + "confidence": 0.978 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 19.84, + "end": 25.26, + "text": " Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes.", + "tokens": [ + 6313, + 4428, + 11, + 1930, + 8487, + 1264, + 421, + 6, + 388, + 1740, + 642, + 6212, + 368, + 945, + 1567, + 17338, + 1512, + 358, + 1625, + 1512, + 4792, + 13923, + 2156, + 4666, + 6592, + 724, + 5714, + 1531, + 596, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.23666970461409614, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.1567964404821396, + "confidence": 0.92, + "words": [ + { + "text": "Mais", + "start": 19.84, + "end": 20.22, + "confidence": 0.944 + }, + { + "text": "bon,", + "start": 20.22, + "end": 20.52, + "confidence": 0.667 + }, + { + "text": "il", + "start": 20.52, + "end": 20.6, + "confidence": 0.99 + }, + { + "text": "faut", + "start": 20.6, + "end": 20.7, + "confidence": 0.99 + }, + { + "text": "dire", + "start": 20.7, + "end": 20.84, + "confidence": 0.995 + }, + { + "text": "qu'il", + "start": 20.84, + "end": 20.96, + "confidence": 0.88 + }, + { + "text": "profite", + "start": 20.96, + "end": 21.26, + "confidence": 0.995 + }, + { + "text": "aussi", + "start": 21.26, + "end": 21.68, + "confidence": 0.972 + }, + { + "text": "de", + "start": 21.68, + "end": 21.9, + "confidence": 0.97 + }, + { + "text": "20", + "start": 21.9, + "end": 22.1, + "confidence": 0.812 + }, + { + "text": "ans", + "start": 22.1, + "end": 22.32, + "confidence": 0.997 + }, + { + "text": "pendant", + "start": 22.32, + "end": 22.48, + "confidence": 0.72 + }, + { + "text": "lesquels", + "start": 22.48, + "end": 22.92, + "confidence": 0.98 + }, + { + "text": "les", + "start": 22.92, + "end": 23.04, + "confidence": 0.709 + }, + { + "text": "ordinateurs", + "start": 23.04, + "end": 23.54, + "confidence": 0.965 + }, + { + "text": 
"nous", + "start": 23.54, + "end": 23.72, + "confidence": 0.602 + }, + { + "text": "ont", + "start": 23.72, + "end": 23.82, + "confidence": 0.974 + }, + { + "text": "appris", + "start": 23.82, + "end": 24.1, + "confidence": 0.991 + }, + { + "text": "à", + "start": 24.1, + "end": 24.24, + "confidence": 0.829 + }, + { + "text": "cliquer", + "start": 24.24, + "end": 24.5, + "confidence": 0.989 + }, + { + "text": "sur", + "start": 24.5, + "end": 24.66, + "confidence": 0.984 + }, + { + "text": "des", + "start": 24.66, + "end": 24.94, + "confidence": 0.971 + }, + { + "text": "icônes.", + "start": 24.94, + "end": 25.26, + "confidence": 0.992 + } + ] + }, + { + "id": 7, + "seek": 2534, + "start": 25.42, + "end": 30.64, + "text": " Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible.", + "tokens": [ + 318, + 9507, + 631, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 1769, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.969, + "words": [ + { + "text": "Sauf", + "start": 25.42, + "end": 25.76, + "confidence": 0.99 + }, + { + "text": "que", + "start": 25.76, + "end": 26.26, + "confidence": 0.996 + }, + { + "text": "le", + "start": 26.26, + "end": 26.66, + "confidence": 0.631 + }, + { + "text": "smartphone", + "start": 26.66, + "end": 27.06, + "confidence": 0.996 + }, + { + "text": "ajoute", + "start": 27.06, + "end": 27.44, + "confidence": 0.991 + }, + { + "text": "le", + "start": 27.44, + "end": 27.62, + "confidence": 0.992 + }, + { + "text": "toucher,", + "start": 27.62, + "end": 28.18, + "confidence": 0.988 + }, + { + "text": "ce", + "start": 28.18, + "end": 28.22, + "confidence": 0.99 + }, + { + "text": "qui", + "start": 28.22, + "end": 28.28, + "confidence": 1.0 + }, + { + "text": "rend", + "start": 28.28, + "end": 28.48, 
+ "confidence": 0.994 + }, + { + "text": "le", + "start": 28.48, + "end": 28.68, + "confidence": 0.993 + }, + { + "text": "contact", + "start": 28.68, + "end": 29.1, + "confidence": 0.999 + }, + { + "text": "plus", + "start": 29.1, + "end": 29.46, + "confidence": 0.985 + }, + { + "text": "direct,", + "start": 29.46, + "end": 30.22, + "confidence": 0.995 + }, + { + "text": "plus", + "start": 30.22, + "end": 30.26, + "confidence": 0.994 + }, + { + "text": "sensible.", + "start": 30.26, + "end": 30.64, + "confidence": 0.997 + } + ] + }, + { + "id": 8, + "seek": 2534, + "start": 31.04, + "end": 37.82, + "text": " Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but.", + "tokens": [ + 3790, + 9093, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193, + 476, + 18437, + 10095, + 602, + 84, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 1609, + 457, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.892, + "words": [ + { + "text": "Et", + "start": 31.04, + "end": 31.22, + "confidence": 0.97 + }, + { + "text": "puis", + "start": 31.22, + "end": 31.36, + "confidence": 0.971 + }, + { + "text": "évidemment,", + "start": 31.36, + "end": 31.7, + "confidence": 0.875 + }, + { + "text": "il", + "start": 31.7, + "end": 31.74, + "confidence": 0.993 + }, + { + "text": "faudrait", + "start": 31.74, + "end": 31.94, + "confidence": 0.995 + }, + { + "text": "parler", + "start": 31.94, + "end": 32.12, + "confidence": 0.84 + }, + { + "text": "aussi", + "start": 32.12, + "end": 32.34, + "confidence": 0.977 + }, + { + "text": "des", + "start": 32.34, + "end": 32.48, + "confidence": 0.994 + }, + { + "text": "applications", + "start": 32.48, + "end": 32.9, + "confidence": 0.993 + }, + { + 
"text": "qui", + "start": 32.9, + "end": 33.18, + "confidence": 0.481 + }, + { + "text": "permettent", + "start": 33.18, + "end": 33.74, + "confidence": 0.992 + }, + { + "text": "de", + "start": 33.74, + "end": 33.96, + "confidence": 0.885 + }, + { + "text": "contourner", + "start": 33.96, + "end": 34.42, + "confidence": 0.958 + }, + { + "text": "le", + "start": 34.42, + "end": 34.52, + "confidence": 0.775 + }, + { + "text": "côté", + "start": 34.52, + "end": 34.8, + "confidence": 0.984 + }, + { + "text": "touffu", + "start": 34.8, + "end": 35.32, + "confidence": 0.741 + }, + { + "text": "de", + "start": 35.32, + "end": 35.72, + "confidence": 0.882 + }, + { + "text": "la", + "start": 35.72, + "end": 35.78, + "confidence": 0.992 + }, + { + "text": "navigation", + "start": 35.78, + "end": 36.24, + "confidence": 0.994 + }, + { + "text": "web", + "start": 36.24, + "end": 36.6, + "confidence": 0.854 + }, + { + "text": "pour", + "start": 36.6, + "end": 36.78, + "confidence": 0.585 + }, + { + "text": "aller", + "start": 36.78, + "end": 36.98, + "confidence": 0.987 + }, + { + "text": "directement", + "start": 36.98, + "end": 37.52, + "confidence": 0.997 + }, + { + "text": "au", + "start": 37.52, + "end": 37.68, + "confidence": 0.967 + }, + { + "text": "but.", + "start": 37.68, + "end": 37.82, + "confidence": 0.995 + } + ] + }, + { + "id": 9, + "seek": 2534, + "start": 37.82, + "end": 46.54, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 8603, + 14964, + 9400, + 38268, + 6176, + 421, + 6, + 388, + 871, + 6070, + 271, + 443, + 5199, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 
1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.974, + "words": [ + { + "text": "Bref,", + "start": 37.82, + "end": 38.76, + "confidence": 0.987 + }, + { + "text": "tout", + "start": 38.76, + "end": 38.98, + "confidence": 0.711 + }, + { + "text": "ça,", + "start": 38.98, + "end": 39.42, + "confidence": 0.995 + }, + { + "text": "ce", + "start": 39.42, + "end": 39.7, + "confidence": 0.993 + }, + { + "text": "sont", + "start": 39.7, + "end": 39.88, + "confidence": 0.999 + }, + { + "text": "les", + "start": 39.88, + "end": 40.16, + "confidence": 0.991 + }, + { + "text": "conditions", + "start": 40.16, + "end": 40.68, + "confidence": 0.995 + }, + { + "text": "qui", + "start": 40.68, + "end": 40.96, + "confidence": 0.997 + }, + { + "text": "permettent", + "start": 40.96, + "end": 41.46, + "confidence": 0.997 + }, + { + "text": "de", + "start": 41.46, + "end": 41.6, + "confidence": 0.998 + }, + { + "text": "créer", + "start": 41.6, + "end": 42.06, + "confidence": 0.998 + }, + { + "text": "cet", + "start": 42.06, + "end": 42.38, + "confidence": 0.998 + }, + { + "text": "objet", + "start": 42.38, + "end": 42.6, + "confidence": 0.994 + }, + { + "text": "dont", + "start": 42.6, + "end": 42.8, + "confidence": 0.779 + }, + { + "text": "Nicolas", + "start": 42.8, + "end": 43.26, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 43.26, + "end": 43.5, + "confidence": 0.986 + }, + { + "text": "qu'il", + "start": 43.5, + "end": 43.7, + "confidence": 0.983 + }, + { + "text": "est", + "start": 43.7, + "end": 43.88, + "confidence": 0.991 + }, + { + "text": "vraisemblablement", + "start": 43.88, + "end": 44.98, + "confidence": 0.991 + }, + { + "text": "inédit", + "start": 44.98, + "end": 45.38, + "confidence": 0.98 + }, + { + "text": "dans", + "start": 45.38, + "end": 45.7, + "confidence": 0.969 + }, + { + "text": "l'histoire", + "start": 45.7, + "end": 45.98, + "confidence": 0.957 + }, + { + "text": "de", + "start": 45.98, + "end": 46.18, + 
"confidence": 0.999 + }, + { + "text": "l'humanité.", + "start": 46.18, + "end": 46.54, + "confidence": 0.992 + } + ] + }, + { + "id": 10, + "seek": 2534, + "start": 46.54, + "end": 48.82, + "text": " Mais ça, ça soulève une autre interrogation.", + "tokens": [ + 6313, + 2788, + 11, + 2788, + 5133, + 31397, + 2251, + 15081, + 24871, + 399, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07915337880452473, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 3.457161710684886e-06, + "confidence": 0.969, + "words": [ + { + "text": "Mais", + "start": 46.54, + "end": 47.24, + "confidence": 0.846 + }, + { + "text": "ça,", + "start": 47.24, + "end": 47.72, + "confidence": 0.935 + }, + { + "text": "ça", + "start": 47.72, + "end": 47.76, + "confidence": 0.977 + }, + { + "text": "soulève", + "start": 47.76, + "end": 47.84, + "confidence": 0.993 + }, + { + "text": "une", + "start": 47.84, + "end": 48.02, + "confidence": 0.998 + }, + { + "text": "autre", + "start": 48.02, + "end": 48.26, + "confidence": 0.999 + }, + { + "text": "interrogation.", + "start": 48.26, + "end": 48.82, + "confidence": 0.997 + } + ] + }, + { + "id": 11, + "seek": 4884, + "start": 49.22, + "end": 55.46, + "text": " Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit?", + "tokens": [ + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 8603, + 14964, + 12703, + 294, + 7811, + 270, + 13716, + 270, + 631, + 10349, + 18018, + 1531, + 8783, + 871, + 6212, + 517, + 18018, + 294, + 7811, + 270, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.988, + "words": [ + { + "text": "Est-ce", + "start": 49.22, + "end": 49.62, + "confidence": 0.982 + }, + { + "text": "que", + "start": 49.62, + "end": 49.72, + "confidence": 0.991 + }, + { + "text": "le", + "start": 49.72, + "end": 49.82, + "confidence": 0.993 + }, + { + "text": 
"fait", + "start": 49.82, + "end": 49.98, + "confidence": 0.999 + }, + { + "text": "que", + "start": 49.98, + "end": 50.14, + "confidence": 0.991 + }, + { + "text": "cet", + "start": 50.14, + "end": 50.32, + "confidence": 0.991 + }, + { + "text": "objet", + "start": 50.32, + "end": 50.66, + "confidence": 0.997 + }, + { + "text": "soit", + "start": 50.66, + "end": 51.12, + "confidence": 0.995 + }, + { + "text": "inédit", + "start": 51.12, + "end": 51.8, + "confidence": 0.996 + }, + { + "text": "induit", + "start": 51.8, + "end": 52.32, + "confidence": 0.977 + }, + { + "text": "que", + "start": 52.32, + "end": 52.42, + "confidence": 0.983 + }, + { + "text": "notre", + "start": 52.42, + "end": 52.72, + "confidence": 0.996 + }, + { + "text": "rapport", + "start": 52.72, + "end": 53.28, + "confidence": 0.997 + }, + { + "text": "à", + "start": 53.28, + "end": 53.44, + "confidence": 0.978 + }, + { + "text": "lui", + "start": 53.44, + "end": 53.66, + "confidence": 0.999 + }, + { + "text": "est", + "start": 53.66, + "end": 54.02, + "confidence": 0.916 + }, + { + "text": "aussi", + "start": 54.02, + "end": 54.54, + "confidence": 0.995 + }, + { + "text": "un", + "start": 54.54, + "end": 54.7, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 54.7, + "end": 55.0, + "confidence": 0.996 + }, + { + "text": "inédit?", + "start": 55.0, + "end": 55.46, + "confidence": 0.996 + } + ] + }, + { + "id": 12, + "seek": 4884, + "start": 55.46, + "end": 63.12, + "text": " Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone?", + "tokens": [ + 2588, + 16389, + 1264, + 11, + 871, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 13307, + 871, + 25323, + 1531, + 22829, + 421, + 6, + 266, + 3962, + 1147, + 1001, + 1531, + 274, + 6, + 16752, + 1111, + 25349, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506 + ], + "temperature": 0.0, + 
"avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.965, + "words": [ + { + "text": "Je", + "start": 55.46, + "end": 55.9, + "confidence": 0.88 + }, + { + "text": "veux", + "start": 55.9, + "end": 56.0, + "confidence": 0.988 + }, + { + "text": "dire,", + "start": 56.0, + "end": 56.24, + "confidence": 0.997 + }, + { + "text": "est-ce", + "start": 56.24, + "end": 56.36, + "confidence": 0.99 + }, + { + "text": "que", + "start": 56.36, + "end": 56.42, + "confidence": 0.99 + }, + { + "text": "le", + "start": 56.42, + "end": 56.58, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 56.58, + "end": 56.88, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 56.88, + "end": 57.04, + "confidence": 0.986 + }, + { + "text": "a", + "start": 57.04, + "end": 57.18, + "confidence": 0.989 + }, + { + "text": "au", + "start": 57.18, + "end": 57.28, + "confidence": 0.968 + }, + { + "text": "smartphone", + "start": 57.28, + "end": 57.6, + "confidence": 0.994 + }, + { + "text": "est", + "start": 57.6, + "end": 57.92, + "confidence": 0.95 + }, + { + "text": "comparable", + "start": 57.92, + "end": 58.24, + "confidence": 0.997 + }, + { + "text": "à", + "start": 58.24, + "end": 58.48, + "confidence": 0.949 + }, + { + "text": "celui", + "start": 58.48, + "end": 58.66, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 58.66, + "end": 58.9, + "confidence": 0.989 + }, + { + "text": "entretenait", + "start": 58.9, + "end": 59.32, + "confidence": 0.929 + }, + { + "text": "à", + "start": 59.32, + "end": 59.46, + "confidence": 0.958 + }, + { + "text": "d'autres", + "start": 59.46, + "end": 59.7, + "confidence": 0.997 + }, + { + "text": "objets", + "start": 59.7, + "end": 59.96, + "confidence": 0.991 + }, + { + "text": "techniques", + "start": 59.96, + "end": 60.46, + "confidence": 0.983 + }, + { + "text": "comme", + "start": 60.46, + "end": 60.88, + "confidence": 0.587 + }, + { 
+ "text": "la", + "start": 60.88, + "end": 61.5, + "confidence": 0.987 + }, + { + "text": "voiture", + "start": 61.5, + "end": 62.06, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 62.06, + "end": 62.36, + "confidence": 0.945 + }, + { + "text": "le", + "start": 62.36, + "end": 62.68, + "confidence": 0.998 + }, + { + "text": "téléphone?", + "start": 62.68, + "end": 63.12, + "confidence": 0.999 + } + ] + }, + { + "id": 13, + "seek": 4884, + "start": 63.36, + "end": 66.66, + "text": " Il n'y a pas d'équivalent en fait.", + "tokens": [ + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 465, + 3887, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.936, + "words": [ + { + "text": "Il", + "start": 63.36, + "end": 65.42, + "confidence": 0.779 + }, + { + "text": "n'y", + "start": 65.42, + "end": 65.48, + "confidence": 0.978 + }, + { + "text": "a", + "start": 65.48, + "end": 65.54, + "confidence": 0.992 + }, + { + "text": "pas", + "start": 65.54, + "end": 65.66, + "confidence": 0.999 + }, + { + "text": "d'équivalent", + "start": 65.66, + "end": 66.22, + "confidence": 0.995 + }, + { + "text": "en", + "start": 66.22, + "end": 66.42, + "confidence": 0.601 + }, + { + "text": "fait.", + "start": 66.42, + "end": 66.66, + "confidence": 0.996 + } + ] + }, + { + "id": 14, + "seek": 4884, + "start": 66.88, + "end": 71.52, + "text": " Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant.", + "tokens": [ + 3790, + 5926, + 5550, + 7089, + 30236, + 368, + 11456, + 1375, + 526, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 11, + 269, + 6, + 377, + 7184, + 259, + 394, + 1030, + 7245, + 351, + 5798, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.953, + 
"words": [ + { + "text": "Et", + "start": 66.88, + "end": 66.98, + "confidence": 0.599 + }, + { + "text": "donc", + "start": 66.98, + "end": 67.08, + "confidence": 0.901 + }, + { + "text": "cette", + "start": 67.08, + "end": 67.28, + "confidence": 0.71 + }, + { + "text": "espèce", + "start": 67.28, + "end": 67.54, + "confidence": 0.995 + }, + { + "text": "de", + "start": 67.54, + "end": 67.68, + "confidence": 0.999 + }, + { + "text": "nouveauté", + "start": 67.68, + "end": 68.48, + "confidence": 0.979 + }, + { + "text": "dans", + "start": 68.48, + "end": 68.66, + "confidence": 0.98 + }, + { + "text": "la", + "start": 68.66, + "end": 68.94, + "confidence": 0.995 + }, + { + "text": "relation", + "start": 68.94, + "end": 69.22, + "confidence": 0.998 + }, + { + "text": "à", + "start": 69.22, + "end": 69.38, + "confidence": 0.997 + }, + { + "text": "l'objet,", + "start": 69.38, + "end": 70.24, + "confidence": 0.997 + }, + { + "text": "c'est", + "start": 70.24, + "end": 70.38, + "confidence": 0.98 + }, + { + "text": "fascinant", + "start": 70.38, + "end": 70.64, + "confidence": 0.978 + }, + { + "text": "et", + "start": 70.64, + "end": 70.76, + "confidence": 0.964 + }, + { + "text": "terrifiant.", + "start": 70.76, + "end": 71.52, + "confidence": 0.977 + } + ] + }, + { + "id": 15, + "seek": 4884, + "start": 71.62, + "end": 76.48, + "text": " Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendants de cet objet,", + "tokens": [ + 20429, + 421, + 6, + 266, + 257, + 287, + 6, + 36107, + 11, + 5173, + 476, + 37313, + 1512, + 33643, + 25929, + 1030, + 1512, + 3328, + 11, + 274, + 6, + 9498, + 45768, + 1719, + 368, + 8603, + 14964, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.10746372298689078, + "compression_ratio": 1.662379421221865, + "no_speech_prob": 1.3105129255563952e-05, + "confidence": 0.813, + "words": [ + { + "text": "Parce", + "start": 71.62, + "end": 71.86, + "confidence": 0.512 + }, + { + "text": "qu'on", + "start": 
71.86, + "end": 72.12, + "confidence": 0.937 + }, + { + "text": "a", + "start": 72.12, + "end": 72.44, + "confidence": 0.982 + }, + { + "text": "l'impression,", + "start": 72.44, + "end": 73.56, + "confidence": 0.998 + }, + { + "text": "comme", + "start": 73.56, + "end": 73.84, + "confidence": 0.964 + }, + { + "text": "le", + "start": 73.84, + "end": 74.0, + "confidence": 0.984 + }, + { + "text": "disent", + "start": 74.0, + "end": 74.2, + "confidence": 0.998 + }, + { + "text": "les", + "start": 74.2, + "end": 74.4, + "confidence": 0.994 + }, + { + "text": "utilisateurs", + "start": 74.4, + "end": 74.84, + "confidence": 0.997 + }, + { + "text": "et", + "start": 74.84, + "end": 74.96, + "confidence": 0.329 + }, + { + "text": "les", + "start": 74.96, + "end": 75.0, + "confidence": 0.773 + }, + { + "text": "services,", + "start": 75.0, + "end": 75.22, + "confidence": 0.214 + }, + { + "text": "d'être", + "start": 75.22, + "end": 75.42, + "confidence": 0.766 + }, + { + "text": "dépendants", + "start": 75.42, + "end": 75.96, + "confidence": 0.789 + }, + { + "text": "de", + "start": 75.96, + "end": 76.08, + "confidence": 0.986 + }, + { + "text": "cet", + "start": 76.08, + "end": 76.26, + "confidence": 0.996 + }, + { + "text": "objet,", + "start": 76.26, + "end": 76.48, + "confidence": 0.996 + } + ] + }, + { + "id": 16, + "seek": 7684, + "start": 76.86, + "end": 83.26, + "text": " d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet.", + "tokens": [ + 274, + 6, + 471, + 43612, + 465, + 3887, + 2251, + 7089, + 30236, + 368, + 9721, + 11, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 368, + 287, + 6, + 335, + 781, + 374, + 1030, + 1956, + 669, + 18832, + 6212, + 1531, + 730, + 1254, + 279, + 368, + 319, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + 
"confidence": 0.917, + "words": [ + { + "text": "d'induire", + "start": 76.86, + "end": 77.08, + "confidence": 0.841 + }, + { + "text": "en", + "start": 77.08, + "end": 77.24, + "confidence": 0.618 + }, + { + "text": "fait", + "start": 77.24, + "end": 77.34, + "confidence": 0.994 + }, + { + "text": "une", + "start": 77.34, + "end": 77.52, + "confidence": 0.983 + }, + { + "text": "espèce", + "start": 77.52, + "end": 77.88, + "confidence": 0.996 + }, + { + "text": "de", + "start": 77.88, + "end": 78.48, + "confidence": 0.997 + }, + { + "text": "relation,", + "start": 78.48, + "end": 78.6, + "confidence": 0.596 + }, + { + "text": "de", + "start": 78.6, + "end": 78.94, + "confidence": 0.987 + }, + { + "text": "médiation", + "start": 78.94, + "end": 79.52, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 79.52, + "end": 79.74, + "confidence": 0.967 + }, + { + "text": "le", + "start": 79.74, + "end": 79.92, + "confidence": 0.998 + }, + { + "text": "monde", + "start": 79.92, + "end": 80.64, + "confidence": 0.992 + }, + { + "text": "qui", + "start": 80.64, + "end": 81.1, + "confidence": 0.696 + }, + { + "text": "rend", + "start": 81.1, + "end": 81.64, + "confidence": 0.91 + }, + { + "text": "de", + "start": 81.64, + "end": 81.78, + "confidence": 0.712 + }, + { + "text": "l'ampleur", + "start": 81.78, + "end": 82.02, + "confidence": 0.987 + }, + { + "text": "et", + "start": 82.02, + "end": 82.12, + "confidence": 0.931 + }, + { + "text": "qui", + "start": 82.12, + "end": 82.24, + "confidence": 0.976 + }, + { + "text": "amène", + "start": 82.24, + "end": 82.36, + "confidence": 0.973 + }, + { + "text": "aussi", + "start": 82.36, + "end": 82.56, + "confidence": 0.938 + }, + { + "text": "à", + "start": 82.56, + "end": 82.62, + "confidence": 0.941 + }, + { + "text": "des", + "start": 82.62, + "end": 82.72, + "confidence": 0.992 + }, + { + "text": "formes", + "start": 82.72, + "end": 82.9, + "confidence": 0.993 + }, + { + "text": "de", + "start": 82.9, + "end": 83.02, + 
"confidence": 0.998 + }, + { + "text": "rejet.", + "start": 83.02, + "end": 83.26, + "confidence": 0.883 + } + ] + }, + { + "id": 17, + "seek": 7684, + "start": 83.94, + "end": 87.8, + "text": " Donc, à objet inédit, rapport inédit.", + "tokens": [ + 7477, + 11, + 1531, + 14964, + 294, + 7811, + 270, + 11, + 18018, + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.962, + "words": [ + { + "text": "Donc,", + "start": 83.94, + "end": 84.94, + "confidence": 0.971 + }, + { + "text": "à", + "start": 84.94, + "end": 84.98, + "confidence": 0.88 + }, + { + "text": "objet", + "start": 84.98, + "end": 85.36, + "confidence": 0.828 + }, + { + "text": "inédit,", + "start": 85.36, + "end": 86.56, + "confidence": 0.993 + }, + { + "text": "rapport", + "start": 86.56, + "end": 87.0, + "confidence": 0.981 + }, + { + "text": "inédit.", + "start": 87.0, + "end": 87.8, + "confidence": 0.998 + } + ] + }, + { + "id": 18, + "seek": 7684, + "start": 88.02, + "end": 95.14, + "text": " Et ce rapport, si j'en crois Nicolas, serait caractérisé par un mélange de dépendance et de rejet.", + "tokens": [ + 3790, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 21724, + 38268, + 11, + 23139, + 1032, + 578, + 4198, + 22118, + 971, + 517, + 41953, + 933, + 368, + 45768, + 719, + 1030, + 368, + 319, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.972, + "words": [ + { + "text": "Et", + "start": 88.02, + "end": 88.48, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 88.48, + "end": 88.86, + "confidence": 0.975 + }, + { + "text": "rapport,", + "start": 88.86, + "end": 89.28, + "confidence": 0.998 + }, + { + "text": "si", + "start": 89.28, + "end": 89.56, + "confidence": 0.999 + }, + { + "text": "j'en", + "start": 
89.56, + "end": 89.84, + "confidence": 0.996 + }, + { + "text": "crois", + "start": 89.84, + "end": 89.88, + "confidence": 0.984 + }, + { + "text": "Nicolas,", + "start": 89.88, + "end": 90.54, + "confidence": 0.681 + }, + { + "text": "serait", + "start": 90.54, + "end": 90.94, + "confidence": 0.885 + }, + { + "text": "caractérisé", + "start": 90.94, + "end": 91.8, + "confidence": 0.993 + }, + { + "text": "par", + "start": 91.8, + "end": 92.12, + "confidence": 0.997 + }, + { + "text": "un", + "start": 92.12, + "end": 92.44, + "confidence": 0.997 + }, + { + "text": "mélange", + "start": 92.44, + "end": 92.98, + "confidence": 0.999 + }, + { + "text": "de", + "start": 92.98, + "end": 93.4, + "confidence": 0.998 + }, + { + "text": "dépendance", + "start": 93.4, + "end": 94.24, + "confidence": 0.953 + }, + { + "text": "et", + "start": 94.24, + "end": 94.54, + "confidence": 0.998 + }, + { + "text": "de", + "start": 94.54, + "end": 94.68, + "confidence": 0.999 + }, + { + "text": "rejet.", + "start": 94.68, + "end": 95.14, + "confidence": 0.993 + } + ] + }, + { + "id": 19, + "seek": 7684, + "start": 95.78, + "end": 102.86, + "text": " Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies", + "tokens": [ + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 5732, + 962, + 1712, + 14953, + 287, + 6, + 29093, + 730, + 1111, + 25349, + 7512, + 1030, + 368, + 9580, + 8969, + 313, + 2680, + 3269, + 371, + 530 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.941, + "words": [ + { + "text": "Bon,", + "start": 95.78, + "end": 96.38, + "confidence": 0.792 + }, + { + "text": "en", + "start": 96.38, + "end": 96.52, + "confidence": 0.998 + }, + { + "text": "vrai,", + "start": 96.52, + "end": 97.14, + "confidence": 0.994 + }, + { + "text": "il", + "start": 97.14, 
+ "end": 97.18, + "confidence": 0.998 + }, + { + "text": "faudrait", + "start": 97.18, + "end": 97.58, + "confidence": 0.997 + }, + { + "text": "remonter", + "start": 97.58, + "end": 98.08, + "confidence": 0.997 + }, + { + "text": "très", + "start": 98.08, + "end": 98.6, + "confidence": 0.997 + }, + { + "text": "très", + "start": 98.6, + "end": 98.7, + "confidence": 0.768 + }, + { + "text": "finement", + "start": 98.7, + "end": 99.32, + "confidence": 0.849 + }, + { + "text": "toute", + "start": 99.32, + "end": 99.7, + "confidence": 0.984 + }, + { + "text": "l'histoire", + "start": 99.7, + "end": 100.06, + "confidence": 0.997 + }, + { + "text": "des", + "start": 100.06, + "end": 100.24, + "confidence": 0.998 + }, + { + "text": "objets", + "start": 100.24, + "end": 100.48, + "confidence": 0.999 + }, + { + "text": "techniques", + "start": 100.48, + "end": 101.02, + "confidence": 0.984 + }, + { + "text": "et", + "start": 101.02, + "end": 101.48, + "confidence": 0.527 + }, + { + "text": "de", + "start": 101.48, + "end": 101.68, + "confidence": 0.994 + }, + { + "text": "leur", + "start": 101.68, + "end": 101.84, + "confidence": 0.833 + }, + { + "text": "insertion", + "start": 101.84, + "end": 102.32, + "confidence": 0.994 + }, + { + "text": "dans", + "start": 102.32, + "end": 102.48, + "confidence": 0.99 + }, + { + "text": "nos", + "start": 102.48, + "end": 102.66, + "confidence": 0.998 + }, + { + "text": "vies", + "start": 102.66, + "end": 102.86, + "confidence": 0.998 + } + ] + }, + { + "id": 20, + "seek": 7684, + "start": 102.9, + "end": 105.74, + "text": " pour déterminer si ce rapport est totalement inédit.", + "tokens": [ + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203, + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06937986261704389, + "compression_ratio": 1.6787003610108304, + "no_speech_prob": 5.948771558905719e-06, + "confidence": 0.981, + "words": [ + { + "text": "pour", + "start": 102.9, + "end": 103.06, + 
"confidence": 0.822 + }, + { + "text": "déterminer", + "start": 103.06, + "end": 103.66, + "confidence": 0.997 + }, + { + "text": "si", + "start": 103.66, + "end": 103.76, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 103.76, + "end": 103.94, + "confidence": 0.997 + }, + { + "text": "rapport", + "start": 103.94, + "end": 104.26, + "confidence": 0.997 + }, + { + "text": "est", + "start": 104.26, + "end": 104.74, + "confidence": 0.998 + }, + { + "text": "totalement", + "start": 104.74, + "end": 105.3, + "confidence": 0.999 + }, + { + "text": "inédit.", + "start": 105.3, + "end": 105.74, + "confidence": 0.999 + } + ] + }, + { + "id": 21, + "seek": 10584, + "start": 106.1, + "end": 109.34, + "text": " Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment.", + "tokens": [ + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 408, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.94, + "words": [ + { + "text": "Mais", + "start": 106.1, + "end": 106.36, + "confidence": 0.947 + }, + { + "text": "j'ai", + "start": 106.36, + "end": 106.92, + "confidence": 0.941 + }, + { + "text": "l'impression", + "start": 106.92, + "end": 107.36, + "confidence": 0.996 + }, + { + "text": "comme", + "start": 107.36, + "end": 107.56, + "confidence": 0.641 + }, + { + "text": "ça", + "start": 107.56, + "end": 107.82, + "confidence": 0.978 + }, + { + "text": "que", + "start": 107.82, + "end": 107.96, + "confidence": 0.976 + }, + { + "text": "Nicolas", + "start": 107.96, + "end": 108.46, + "confidence": 0.985 + }, + { + "text": "ne", + "start": 108.46, + "end": 108.66, + "confidence": 0.726 + }, + { + "text": "se", + "start": 108.66, + "end": 108.7, + "confidence": 0.991 + }, + { + "text": "trompe", + "start": 108.7, + "end": 108.88, + "confidence": 0.995 + }, + { + "text": 
"pas", + "start": 108.88, + "end": 109.08, + "confidence": 0.999 + }, + { + "text": "vraiment.", + "start": 109.08, + "end": 109.34, + "confidence": 0.991 + } + ] + }, + { + "id": 22, + "seek": 10584, + "start": 109.88, + "end": 114.98, + "text": " Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone.", + "tokens": [ + 8732, + 34081, + 631, + 1506, + 262, + 6000, + 11, + 1930, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698, + 1581, + 47159, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.969, + "words": [ + { + "text": "Pour", + "start": 109.88, + "end": 110.08, + "confidence": 0.997 + }, + { + "text": "autant", + "start": 110.08, + "end": 110.24, + "confidence": 1.0 + }, + { + "text": "que", + "start": 110.24, + "end": 110.42, + "confidence": 0.988 + }, + { + "text": "je", + "start": 110.42, + "end": 110.52, + "confidence": 0.998 + }, + { + "text": "sache,", + "start": 110.52, + "end": 111.14, + "confidence": 0.963 + }, + { + "text": "il", + "start": 111.14, + "end": 111.18, + "confidence": 0.997 + }, + { + "text": "y", + "start": 111.18, + "end": 111.32, + "confidence": 0.992 + }, + { + "text": "a", + "start": 111.32, + "end": 111.36, + "confidence": 0.993 + }, + { + "text": "eu", + "start": 111.36, + "end": 111.68, + "confidence": 0.998 + }, + { + "text": "plein", + "start": 111.68, + "end": 111.88, + "confidence": 0.974 + }, + { + "text": "de", + "start": 111.88, + "end": 112.06, + "confidence": 0.997 + }, + { + "text": "discussions", + "start": 112.06, + "end": 112.6, + "confidence": 0.799 + }, + { + "text": "autour", + "start": 112.6, + "end": 112.94, + "confidence": 0.995 + }, + { + "text": "de", + "start": 112.94, + "end": 113.46, + "confidence": 0.997 + }, + { + "text": "la", + "start": 113.46, + "end": 113.52, + "confidence": 0.998 + }, + { 
+ "text": "voiture", + "start": 113.52, + "end": 113.86, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 113.86, + "end": 114.06, + "confidence": 0.765 + }, + { + "text": "même", + "start": 114.06, + "end": 114.44, + "confidence": 0.996 + }, + { + "text": "du", + "start": 114.44, + "end": 114.6, + "confidence": 0.995 + }, + { + "text": "téléphone.", + "start": 114.6, + "end": 114.98, + "confidence": 0.999 + } + ] + }, + { + "id": 23, + "seek": 10584, + "start": 115.34, + "end": 119.84, + "text": " Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre.", + "tokens": [ + 6313, + 635, + 45768, + 719, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13, + 7477, + 476, + 319, + 7108, + 2107, + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.972, + "words": [ + { + "text": "Mais", + "start": 115.34, + "end": 115.72, + "confidence": 0.994 + }, + { + "text": "la", + "start": 115.72, + "end": 116.02, + "confidence": 0.937 + }, + { + "text": "dépendance", + "start": 116.02, + "end": 116.4, + "confidence": 0.997 + }, + { + "text": "n'était", + "start": 116.4, + "end": 116.62, + "confidence": 0.994 + }, + { + "text": "pas", + "start": 116.62, + "end": 117.0, + "confidence": 0.998 + }, + { + "text": "du", + "start": 117.0, + "end": 117.16, + "confidence": 0.995 + }, + { + "text": "même", + "start": 117.16, + "end": 117.46, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 117.46, + "end": 117.78, + "confidence": 0.999 + }, + { + "text": "Donc", + "start": 117.78, + "end": 117.98, + "confidence": 0.804 + }, + { + "text": "le", + "start": 117.98, + "end": 118.34, + "confidence": 0.715 + }, + { + "text": "rejet", + "start": 118.34, + "end": 118.62, + "confidence": 0.999 + }, + { + "text": "non", + "start": 118.62, + "end": 
118.78, + "confidence": 0.975 + }, + { + "text": "plus", + "start": 118.78, + "end": 118.94, + "confidence": 0.996 + }, + { + "text": "n'était", + "start": 118.94, + "end": 119.12, + "confidence": 0.987 + }, + { + "text": "pas", + "start": 119.12, + "end": 119.3, + "confidence": 0.998 + }, + { + "text": "du", + "start": 119.3, + "end": 119.38, + "confidence": 0.995 + }, + { + "text": "même", + "start": 119.38, + "end": 119.56, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 119.56, + "end": 119.84, + "confidence": 0.999 + } + ] + }, + { + "id": 24, + "seek": 10584, + "start": 119.98, + "end": 123.02, + "text": " On peut adorer sa bagnole, en avoir besoin pour plein de choses.", + "tokens": [ + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 1771, + 306, + 11, + 465, + 10853, + 19207, + 2016, + 21088, + 368, + 14488, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.991, + "words": [ + { + "text": "On", + "start": 119.98, + "end": 120.18, + "confidence": 0.996 + }, + { + "text": "peut", + "start": 120.18, + "end": 120.38, + "confidence": 0.997 + }, + { + "text": "adorer", + "start": 120.38, + "end": 120.66, + "confidence": 0.99 + }, + { + "text": "sa", + "start": 120.66, + "end": 120.88, + "confidence": 0.985 + }, + { + "text": "bagnole,", + "start": 120.88, + "end": 121.46, + "confidence": 0.984 + }, + { + "text": "en", + "start": 121.46, + "end": 121.56, + "confidence": 0.989 + }, + { + "text": "avoir", + "start": 121.56, + "end": 121.74, + "confidence": 0.998 + }, + { + "text": "besoin", + "start": 121.74, + "end": 122.1, + "confidence": 0.999 + }, + { + "text": "pour", + "start": 122.1, + "end": 122.34, + "confidence": 0.987 + }, + { + "text": "plein", + "start": 122.34, + "end": 122.68, + "confidence": 0.989 + }, + { + "text": "de", + "start": 122.68, + "end": 122.8, + "confidence": 0.998 + }, + { + "text": "choses.", + 
"start": 122.8, + "end": 123.02, + "confidence": 0.989 + } + ] + }, + { + "id": 25, + "seek": 10584, + "start": 123.28, + "end": 126.36, + "text": " Et bien, le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 3790, + 3610, + 11, + 476, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + "compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.895, + "words": [ + { + "text": "Et", + "start": 123.28, + "end": 123.46, + "confidence": 0.667 + }, + { + "text": "bien,", + "start": 123.46, + "end": 123.86, + "confidence": 0.469 + }, + { + "text": "le", + "start": 123.86, + "end": 123.98, + "confidence": 0.996 + }, + { + "text": "soir,", + "start": 123.98, + "end": 124.68, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 124.68, + "end": 124.9, + "confidence": 0.997 + }, + { + "text": "on", + "start": 124.9, + "end": 125.02, + "confidence": 0.998 + }, + { + "text": "va", + "start": 125.02, + "end": 125.14, + "confidence": 0.996 + }, + { + "text": "se", + "start": 125.14, + "end": 125.38, + "confidence": 0.988 + }, + { + "text": "coucher,", + "start": 125.38, + "end": 125.8, + "confidence": 0.987 + }, + { + "text": "on", + "start": 125.8, + "end": 126.02, + "confidence": 0.995 + }, + { + "text": "la", + "start": 126.02, + "end": 126.22, + "confidence": 0.802 + }, + { + "text": "laisse.", + "start": 126.22, + "end": 126.36, + "confidence": 0.999 + } + ] + }, + { + "id": 26, + "seek": 10584, + "start": 126.98, + "end": 130.48, + "text": " On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes.", + "tokens": [ + 1282, + 408, + 287, + 6, + 64, + 1736, + 2680, + 635, + 2135, + 6932, + 322, + 871, + 1609, + 7997, + 11, + 322, + 408, + 287, + 6, + 443, + 76, + 18832, + 1736, + 1609, + 13228, + 1521, + 279, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.07386374800172571, + 
"compression_ratio": 1.685512367491166, + "no_speech_prob": 5.46344235772267e-05, + "confidence": 0.914, + "words": [ + { + "text": "On", + "start": 126.98, + "end": 127.32, + "confidence": 0.954 + }, + { + "text": "ne", + "start": 127.32, + "end": 127.36, + "confidence": 0.803 + }, + { + "text": "l'a", + "start": 127.36, + "end": 127.48, + "confidence": 0.974 + }, + { + "text": "pas", + "start": 127.48, + "end": 127.68, + "confidence": 0.999 + }, + { + "text": "dans", + "start": 127.68, + "end": 127.8, + "confidence": 0.996 + }, + { + "text": "la", + "start": 127.8, + "end": 128.06, + "confidence": 0.994 + }, + { + "text": "main", + "start": 128.06, + "end": 128.26, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 128.26, + "end": 128.44, + "confidence": 0.935 + }, + { + "text": "on", + "start": 128.44, + "end": 128.62, + "confidence": 0.997 + }, + { + "text": "est", + "start": 128.62, + "end": 128.68, + "confidence": 0.993 + }, + { + "text": "au", + "start": 128.68, + "end": 129.04, + "confidence": 0.984 + }, + { + "text": "lit,", + "start": 129.04, + "end": 129.14, + "confidence": 0.999 + }, + { + "text": "on", + "start": 129.14, + "end": 129.26, + "confidence": 0.427 + }, + { + "text": "ne", + "start": 129.26, + "end": 129.3, + "confidence": 0.963 + }, + { + "text": "l'emmène", + "start": 129.3, + "end": 129.5, + "confidence": 0.992 + }, + { + "text": "pas", + "start": 129.5, + "end": 129.68, + "confidence": 0.997 + }, + { + "text": "au", + "start": 129.68, + "end": 129.86, + "confidence": 0.674 + }, + { + "text": "chiottes.", + "start": 129.86, + "end": 130.48, + "confidence": 0.828 + } + ] + }, + { + "id": 27, + "seek": 13084, + "start": 130.86, + "end": 136.9, + "text": " On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain.", + "tokens": [ + 1282, + 45913, + 7418, + 45045, + 15797, + 971, + 1872, + 275, + 2851, + 1398, + 1956, + 8073, + 1001, + 635, + 34207, + 368, + 
47159, + 17338, + 2251, + 30027, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.955, + "words": [ + { + "text": "On", + "start": 130.86, + "end": 131.04, + "confidence": 0.983 + }, + { + "text": "pouvait", + "start": 131.04, + "end": 131.28, + "confidence": 0.989 + }, + { + "text": "être", + "start": 131.28, + "end": 131.48, + "confidence": 0.996 + }, + { + "text": "énervé", + "start": 131.48, + "end": 132.22, + "confidence": 0.906 + }, + { + "text": "par", + "start": 132.22, + "end": 132.44, + "confidence": 0.991 + }, + { + "text": "son", + "start": 132.44, + "end": 132.7, + "confidence": 0.998 + }, + { + "text": "môme", + "start": 132.7, + "end": 133.1, + "confidence": 0.832 + }, + { + "text": "qui", + "start": 133.1, + "end": 133.34, + "confidence": 0.919 + }, + { + "text": "occupait", + "start": 133.34, + "end": 133.76, + "confidence": 0.991 + }, + { + "text": "la", + "start": 133.76, + "end": 133.8, + "confidence": 0.992 + }, + { + "text": "ligne", + "start": 133.8, + "end": 134.08, + "confidence": 0.999 + }, + { + "text": "de", + "start": 134.08, + "end": 134.14, + "confidence": 0.997 + }, + { + "text": "téléphone", + "start": 134.14, + "end": 134.6, + "confidence": 0.985 + }, + { + "text": "pendant", + "start": 134.6, + "end": 134.82, + "confidence": 0.981 + }, + { + "text": "une", + "start": 134.82, + "end": 135.2, + "confidence": 0.87 + }, + { + "text": "heure", + "start": 135.2, + "end": 135.36, + "confidence": 0.998 + }, + { + "text": "chaque", + "start": 135.36, + "end": 135.54, + "confidence": 0.991 + }, + { + "text": "soir", + "start": 135.54, + "end": 135.8, + "confidence": 0.996 + }, + { + "text": "pour", + "start": 135.8, + "end": 135.96, + "confidence": 0.79 + }, + { + "text": "discuter", + "start": 135.96, + "end": 136.28, + "confidence": 0.997 + 
}, + { + "text": "avec", + "start": 136.28, + "end": 136.48, + "confidence": 0.996 + }, + { + "text": "un", + "start": 136.48, + "end": 136.6, + "confidence": 0.999 + }, + { + "text": "copain.", + "start": 136.6, + "end": 136.9, + "confidence": 0.998 + } + ] + }, + { + "id": 28, + "seek": 13084, + "start": 137.28, + "end": 141.88, + "text": " Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui,", + "tokens": [ + 6313, + 2788, + 408, + 725, + 15750, + 35235, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 1769, + 5698, + 275, + 2851, + 1398, + 14023, + 6, + 10556, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.959, + "words": [ + { + "text": "Mais", + "start": 137.28, + "end": 137.46, + "confidence": 0.993 + }, + { + "text": "ça", + "start": 137.46, + "end": 137.68, + "confidence": 0.938 + }, + { + "text": "ne", + "start": 137.68, + "end": 137.94, + "confidence": 0.998 + }, + { + "text": "ressemblait", + "start": 137.94, + "end": 138.4, + "confidence": 0.991 + }, + { + "text": "pas", + "start": 138.4, + "end": 138.76, + "confidence": 0.995 + }, + { + "text": "à", + "start": 138.76, + "end": 138.94, + "confidence": 0.988 + }, + { + "text": "ce", + "start": 138.94, + "end": 138.98, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 138.98, + "end": 139.1, + "confidence": 0.986 + }, + { + "text": "peut", + "start": 139.1, + "end": 139.48, + "confidence": 0.988 + }, + { + "text": "ressentir", + "start": 139.48, + "end": 140.12, + "confidence": 0.997 + }, + { + "text": "à", + "start": 140.12, + "end": 140.32, + "confidence": 0.498 + }, + { + "text": "voir", + "start": 140.32, + "end": 140.46, + "confidence": 0.855 + }, + { + "text": "ce", + "start": 140.46, + "end": 140.68, + "confidence": 0.989 + }, + { + "text": "même", + "start": 140.68, + "end": 140.94, 
+ "confidence": 0.984 + }, + { + "text": "môme", + "start": 140.94, + "end": 141.34, + "confidence": 0.998 + }, + { + "text": "aujourd'hui,", + "start": 141.34, + "end": 141.88, + "confidence": 0.988 + } + ] + }, + { + "id": 29, + "seek": 13084, + "start": 142.14, + "end": 146.3, + "text": " continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe,", + "tokens": [ + 2354, + 285, + 1712, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 5173, + 1511, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 15165, + 49523, + 454, + 391, + 716, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.963, + "words": [ + { + "text": "continuellement", + "start": 142.14, + "end": 142.94, + "confidence": 0.971 + }, + { + "text": "avec", + "start": 142.94, + "end": 143.18, + "confidence": 0.805 + }, + { + "text": "son", + "start": 143.18, + "end": 143.38, + "confidence": 0.995 + }, + { + "text": "smartphone", + "start": 143.38, + "end": 143.76, + "confidence": 0.978 + }, + { + "text": "dans", + "start": 143.76, + "end": 143.94, + "confidence": 0.979 + }, + { + "text": "la", + "start": 143.94, + "end": 144.0, + "confidence": 0.996 + }, + { + "text": "main,", + "start": 144.0, + "end": 144.36, + "confidence": 0.998 + }, + { + "text": "comme", + "start": 144.36, + "end": 144.52, + "confidence": 0.835 + }, + { + "text": "si", + "start": 144.52, + "end": 144.64, + "confidence": 0.975 + }, + { + "text": "c'était", + "start": 144.64, + "end": 144.82, + "confidence": 0.991 + }, + { + "text": "une", + "start": 144.82, + "end": 145.06, + "confidence": 0.989 + }, + { + "text": "sorte", + "start": 145.06, + "end": 145.22, + "confidence": 0.997 + }, + { + "text": "de", + "start": 145.22, + "end": 145.3, + "confidence": 0.982 + }, + { + "text": "pacemaker", + "start": 145.3, + "end": 145.82, + "confidence": 0.917 + }, + { + "text": 
"externe,", + "start": 145.82, + "end": 146.3, + "confidence": 0.992 + } + ] + }, + { + "id": 30, + "seek": 13084, + "start": 146.34, + "end": 148.84, + "text": " comme si le lâcher allait entraîner sa mort immédiate.", + "tokens": [ + 5173, + 1511, + 476, + 48835, + 6759, + 439, + 1001, + 22284, + 7517, + 1193, + 601, + 6599, + 3397, + 526, + 4504, + 473, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.989, + "words": [ + { + "text": "comme", + "start": 146.34, + "end": 146.58, + "confidence": 0.996 + }, + { + "text": "si", + "start": 146.58, + "end": 146.76, + "confidence": 0.994 + }, + { + "text": "le", + "start": 146.76, + "end": 146.84, + "confidence": 0.997 + }, + { + "text": "lâcher", + "start": 146.84, + "end": 147.36, + "confidence": 0.969 + }, + { + "text": "allait", + "start": 147.36, + "end": 147.56, + "confidence": 0.993 + }, + { + "text": "entraîner", + "start": 147.56, + "end": 147.86, + "confidence": 0.978 + }, + { + "text": "sa", + "start": 147.86, + "end": 148.0, + "confidence": 0.999 + }, + { + "text": "mort", + "start": 148.0, + "end": 148.22, + "confidence": 0.998 + }, + { + "text": "immédiate.", + "start": 148.22, + "end": 148.84, + "confidence": 0.997 + } + ] + }, + { + "id": 31, + "seek": 13084, + "start": 149.04, + "end": 151.96, + "text": " Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi.", + "tokens": [ + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 2851, + 1398, + 11, + 2420, + 269, + 6, + 377, + 24724, + 1323, + 712, + 2016, + 4666, + 6212, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.974, + "words": [ + { + "text": "Bon,", + "start": 149.04, + "end": 149.28, + "confidence": 0.918 + }, + { + "text": "je", + "start": 149.28, + "end": 149.32, + 
"confidence": 0.934 + }, + { + "text": "dis", + "start": 149.32, + "end": 149.46, + "confidence": 0.988 + }, + { + "text": "ça", + "start": 149.46, + "end": 149.64, + "confidence": 0.994 + }, + { + "text": "pour", + "start": 149.64, + "end": 149.74, + "confidence": 0.997 + }, + { + "text": "le", + "start": 149.74, + "end": 149.88, + "confidence": 0.995 + }, + { + "text": "môme,", + "start": 149.88, + "end": 150.32, + "confidence": 0.998 + }, + { + "text": "mais", + "start": 150.32, + "end": 150.52, + "confidence": 0.791 + }, + { + "text": "c'est", + "start": 150.52, + "end": 150.82, + "confidence": 0.981 + }, + { + "text": "évidemment", + "start": 150.82, + "end": 151.14, + "confidence": 0.98 + }, + { + "text": "valable", + "start": 151.14, + "end": 151.48, + "confidence": 0.998 + }, + { + "text": "pour", + "start": 151.48, + "end": 151.62, + "confidence": 0.997 + }, + { + "text": "nous", + "start": 151.62, + "end": 151.76, + "confidence": 0.999 + }, + { + "text": "aussi.", + "start": 151.76, + "end": 151.96, + "confidence": 0.996 + } + ] + }, + { + "id": 32, + "seek": 13084, + "start": 152.34, + "end": 158.22, + "text": " Donc, rapport inédit. D'accord. 
Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais?", + "tokens": [ + 7477, + 11, + 18018, + 294, + 7811, + 270, + 13, + 413, + 6, + 19947, + 13, + 6313, + 19934, + 257, + 12, + 83, + 12, + 266, + 287, + 6, + 36107, + 421, + 6, + 266, + 297, + 6, + 268, + 1333, + 4271, + 14540, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.06199159333200166, + "compression_ratio": 1.6127167630057804, + "no_speech_prob": 1.6126719856401905e-05, + "confidence": 0.948, + "words": [ + { + "text": "Donc,", + "start": 152.34, + "end": 153.46, + "confidence": 0.991 + }, + { + "text": "rapport", + "start": 153.46, + "end": 153.66, + "confidence": 0.976 + }, + { + "text": "inédit.", + "start": 153.66, + "end": 154.24, + "confidence": 0.996 + }, + { + "text": "D'accord.", + "start": 154.24, + "end": 155.48, + "confidence": 0.978 + }, + { + "text": "Mais", + "start": 155.48, + "end": 155.82, + "confidence": 0.557 + }, + { + "text": "pourquoi", + "start": 155.82, + "end": 156.32, + "confidence": 0.994 + }, + { + "text": "a-t-on", + "start": 156.32, + "end": 156.68, + "confidence": 0.94 + }, + { + "text": "l'impression", + "start": 156.68, + "end": 157.06, + "confidence": 0.999 + }, + { + "text": "qu'on", + "start": 157.06, + "end": 157.26, + "confidence": 0.995 + }, + { + "text": "n'en", + "start": 157.26, + "end": 157.44, + "confidence": 0.878 + }, + { + "text": "sortira", + "start": 157.44, + "end": 157.9, + "confidence": 0.989 + }, + { + "text": "jamais?", + "start": 157.9, + "end": 158.22, + "confidence": 0.998 + } + ] + }, + { + "id": 33, + "seek": 15884, + "start": 158.86, + "end": 165.32, + "text": " Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux?", + "tokens": [ + 4410, + 12, + 384, + 421, + 6, + 388, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 8603, + 484, + 388, + 3551, + 303, + 3409, + 2449, + 1030, + 1026, + 
14923, + 1925, + 11, + 1030, + 1026, + 14923, + 1925, + 6992, + 631, + 3551, + 303, + 3409, + 2449, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.079788723507443, + "compression_ratio": 1.6517857142857142, + "no_speech_prob": 5.4980162531137466e-05, + "confidence": 0.962, + "words": [ + { + "text": "Est-ce", + "start": 158.86, + "end": 159.34, + "confidence": 0.981 + }, + { + "text": "qu'il", + "start": 159.34, + "end": 159.46, + "confidence": 0.997 + }, + { + "text": "faut", + "start": 159.46, + "end": 159.62, + "confidence": 0.999 + }, + { + "text": "en", + "start": 159.62, + "end": 159.78, + "confidence": 0.97 + }, + { + "text": "remettre", + "start": 159.78, + "end": 160.12, + "confidence": 0.999 + }, + { + "text": "la", + "start": 160.12, + "end": 160.34, + "confidence": 0.998 + }, + { + "text": "faute", + "start": 160.34, + "end": 160.66, + "confidence": 0.986 + }, + { + "text": "sur", + "start": 160.66, + "end": 160.94, + "confidence": 0.995 + }, + { + "text": "les", + "start": 160.94, + "end": 161.28, + "confidence": 0.995 + }, + { + "text": "gens", + "start": 161.28, + "end": 161.44, + "confidence": 1.0 + }, + { + "text": "qui", + "start": 161.44, + "end": 161.58, + "confidence": 0.984 + }, + { + "text": "ont", + "start": 161.58, + "end": 161.72, + "confidence": 0.998 + }, + { + "text": "créé", + "start": 161.72, + "end": 162.3, + "confidence": 0.99 + }, + { + "text": "cet", + "start": 162.3, + "end": 162.46, + "confidence": 0.852 + }, + { + "text": "outil", + "start": 162.46, + "end": 162.78, + "confidence": 0.99 + }, + { + "text": "merveilleux", + "start": 162.78, + "end": 163.34, + "confidence": 0.994 + }, + { + "text": "et", + "start": 163.34, + "end": 163.5, + "confidence": 0.954 + }, + { + "text": "diabolique,", + "start": 163.5, + "end": 163.86, + "confidence": 0.992 + }, + { + "text": "et", + "start": 163.86, + "end": 163.92, + "confidence": 0.54 + }, + { + "text": "diabolique", + "start": 163.92, + "end": 164.4, + "confidence": 0.951 + }, 
+ { + "text": "parce", + "start": 164.4, + "end": 164.66, + "confidence": 0.703 + }, + { + "text": "que", + "start": 164.66, + "end": 164.84, + "confidence": 0.99 + }, + { + "text": "merveilleux?", + "start": 164.84, + "end": 165.32, + "confidence": 0.997 + } + ] + }, + { + "id": 34, + "seek": 15884, + "start": 166.34, + "end": 168.82, + "text": " Les économistes parlent de dépendance du sentier.", + "tokens": [ + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 2279, + 811, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.079788723507443, + "compression_ratio": 1.6517857142857142, + "no_speech_prob": 5.4980162531137466e-05, + "confidence": 0.984, + "words": [ + { + "text": "Les", + "start": 166.34, + "end": 167.04, + "confidence": 0.926 + }, + { + "text": "économistes", + "start": 167.04, + "end": 167.48, + "confidence": 0.998 + }, + { + "text": "parlent", + "start": 167.48, + "end": 167.68, + "confidence": 0.995 + }, + { + "text": "de", + "start": 167.68, + "end": 167.82, + "confidence": 0.995 + }, + { + "text": "dépendance", + "start": 167.82, + "end": 168.36, + "confidence": 0.985 + }, + { + "text": "du", + "start": 168.36, + "end": 168.5, + "confidence": 0.997 + }, + { + "text": "sentier.", + "start": 168.5, + "end": 168.82, + "confidence": 0.978 + } + ] + }, + { + "id": 35, + "seek": 16884, + "start": 168.86, + "end": 177.42, + "text": " C'est l'idée qu'on est sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "tokens": [ + 50364, + 383, + 6, + 377, + 287, + 6, + 34281, + 421, + 6, + 266, + 871, + 1022, + 517, + 2279, + 811, + 1956, + 257, + 8862, + 4823, + 455, + 2081, + 11, + 12703, + 40005, + 9020, + 518, + 465, + 8368, + 394, + 30677, + 11, + 12703, + 465, + 40763, + 29492, + 730, + 4232, + 279, + 11, + 465, + 40763, + 29492, + 2251, + 6358, + 42379, + 13, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.10415018598238628, + 
"compression_ratio": 1.3916666666666666, + "no_speech_prob": 3.958350498578511e-05, + "confidence": 0.93, + "words": [ + { + "text": "C'est", + "start": 168.86, + "end": 169.1, + "confidence": 0.952 + }, + { + "text": "l'idée", + "start": 169.1, + "end": 169.34, + "confidence": 0.992 + }, + { + "text": "qu'on", + "start": 169.34, + "end": 169.7, + "confidence": 0.825 + }, + { + "text": "est", + "start": 169.7, + "end": 169.88, + "confidence": 0.631 + }, + { + "text": "sur", + "start": 169.88, + "end": 170.0, + "confidence": 0.993 + }, + { + "text": "un", + "start": 170.0, + "end": 170.54, + "confidence": 0.998 + }, + { + "text": "sentier", + "start": 170.54, + "end": 170.78, + "confidence": 0.99 + }, + { + "text": "qui", + "start": 170.78, + "end": 170.84, + "confidence": 0.961 + }, + { + "text": "a", + "start": 170.84, + "end": 170.94, + "confidence": 0.98 + }, + { + "text": "été", + "start": 170.94, + "end": 171.12, + "confidence": 0.996 + }, + { + "text": "établi,", + "start": 171.12, + "end": 171.9, + "confidence": 0.995 + }, + { + "text": "soit", + "start": 171.9, + "end": 172.12, + "confidence": 0.989 + }, + { + "text": "volontairement", + "start": 172.12, + "end": 172.72, + "confidence": 0.965 + }, + { + "text": "en", + "start": 172.72, + "end": 172.8, + "confidence": 0.941 + }, + { + "text": "marchant", + "start": 172.8, + "end": 173.06, + "confidence": 0.997 + }, + { + "text": "dessus,", + "start": 173.06, + "end": 174.24, + "confidence": 0.972 + }, + { + "text": "soit", + "start": 174.24, + "end": 174.92, + "confidence": 0.996 + }, + { + "text": "en", + "start": 174.92, + "end": 175.36, + "confidence": 0.991 + }, + { + "text": "définissant", + "start": 175.36, + "end": 175.5, + "confidence": 0.983 + }, + { + "text": "des", + "start": 175.5, + "end": 175.76, + "confidence": 0.984 + }, + { + "text": "bornes,", + "start": 175.76, + "end": 176.04, + "confidence": 0.975 + }, + { + "text": "en", + "start": 176.04, + "end": 176.08, + "confidence": 0.68 + }, + { 
+ "text": "définissant", + "start": 176.08, + "end": 176.58, + "confidence": 0.997 + }, + { + "text": "une", + "start": 176.58, + "end": 176.82, + "confidence": 0.944 + }, + { + "text": "signalétique.", + "start": 176.82, + "end": 177.42, + "confidence": 0.642 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/bonjour.wav.words.json b/tests/expected/medium_fr/bonjour.wav.words.json new file mode 100644 index 0000000000000000000000000000000000000000..1539b7c83897fb3c4c929768b3ef7782d28c3f37 --- /dev/null +++ b/tests/expected/medium_fr/bonjour.wav.words.json @@ -0,0 +1,32 @@ +{ + "text": " Bonjour !", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.14, + "end": 0.94, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50402 + ], + "temperature": 0.0, + "avg_logprob": -0.7046648502349854, + "compression_ratio": 0.5294117647058824, + "no_speech_prob": 0.08610370755195618, + "confidence": 0.964, + "words": [ + { + "text": "Bonjour !", + "start": 0.14, + "end": 0.94, + "confidence": 0.964 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/bonjour_vous_allez_bien.mp3.words.json b/tests/expected/medium_fr/bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..08b0c5b49b0b16bb75f05209f83a47dced01f458 --- /dev/null +++ b/tests/expected/medium_fr/bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,134 @@ +{ + "text": " Bonjour ! Est-ce que vous allez bien ? Bonjour ! Est-ce que vous allez bien ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 3.46, + "text": " Bonjour ! 
Est-ce que vous allez bien ?", + "tokens": [ + 50364, + 25431, + 2298, + 4410, + 12, + 384, + 631, + 2630, + 18146, + 3610, + 2506, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.3616434610806979, + "compression_ratio": 0.8260869565217391, + "no_speech_prob": 0.07169149070978165, + "confidence": 0.936, + "words": [ + { + "text": "Bonjour !", + "start": 0.42, + "end": 1.92, + "confidence": 0.874 + }, + { + "text": "Est-ce", + "start": 1.92, + "end": 2.16, + "confidence": 0.885 + }, + { + "text": "que", + "start": 2.16, + "end": 2.24, + "confidence": 0.988 + }, + { + "text": "vous", + "start": 2.24, + "end": 2.38, + "confidence": 0.996 + }, + { + "text": "allez", + "start": 2.38, + "end": 2.58, + "confidence": 0.99 + }, + { + "text": "bien ?", + "start": 2.58, + "end": 3.46, + "confidence": 0.999 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 32.94, + "end": 35.86, + "text": " Bonjour ! Est-ce que vous allez bien ?", + "tokens": [ + 50364, + 25431, + 2298, + 4410, + 12, + 384, + 631, + 2630, + 18146, + 3610, + 2506, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.30651259422302246, + "compression_ratio": 0.8260869565217391, + "no_speech_prob": 0.40451279282569885, + "confidence": 0.933, + "words": [ + { + "text": "Bonjour !", + "start": 32.94, + "end": 34.44, + "confidence": 0.741 + }, + { + "text": "Est-ce", + "start": 34.44, + "end": 34.7, + "confidence": 0.921 + }, + { + "text": "que", + "start": 34.7, + "end": 34.76, + "confidence": 0.996 + }, + { + "text": "vous", + "start": 34.76, + "end": 34.9, + "confidence": 0.998 + }, + { + "text": "allez", + "start": 34.9, + "end": 35.1, + "confidence": 0.997 + }, + { + "text": "bien ?", + "start": 35.1, + "end": 35.86, + "confidence": 0.999 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/empty.mp3.words.json b/tests/expected/medium_fr/empty.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..47a1595fd330caa6c2c345a710e711d889a3f382 --- /dev/null +++ b/tests/expected/medium_fr/empty.mp3.words.json @@ -0,0 +1,31 @@ +{ + "text": " ...", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.08, + "end": 1.58, + "text": " ...", + "tokens": [ + 50364, + 1097, + 50518 + ], + "temperature": 0.0, + "avg_logprob": -0.8880113959312439, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.43768733739852905, + "confidence": 0.128, + "words": [ + { + "text": "...", + "start": 0.08, + "end": 1.58, + "confidence": 0.128 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/gaenswein15.mp3.words.json b/tests/expected/medium_fr/gaenswein15.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..95a2283ba53201569be582ec5261ce28bb185973 --- /dev/null +++ b/tests/expected/medium_fr/gaenswein15.mp3.words.json @@ -0,0 +1,31 @@ +{ + "text": " ...", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.0, + "end": 8.46, + "text": " ...", + "tokens": [ + 50364, + 1097, + 51122 + ], + "temperature": 0.0, + "avg_logprob": -1.0786787271499634, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.2541781961917877, + "confidence": 0.133, + "words": [ + { + "text": "...", + "start": 0.0, + "end": 8.46, + "confidence": 0.133 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/gloria.mp3.words.json b/tests/expected/medium_fr/gloria.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..492ca53823a9f27db55911658859392f74a909f8 --- /dev/null +++ b/tests/expected/medium_fr/gloria.mp3.words.json @@ -0,0 +1,31 @@ +{ + "text": " ...", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 20.18, + "end": 20.2, + "text": " ...", + "tokens": [ + 50364, + 1097, + 51392 + ], + "temperature": 0.0, + "avg_logprob": -1.4416182041168213, + "compression_ratio": 
0.2727272727272727, + "no_speech_prob": 0.05016394704580307, + "confidence": 0.158, + "words": [ + { + "text": "...", + "start": 20.18, + "end": 20.2, + "confidence": 0.158 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/laugh1.mp3.words.json b/tests/expected/medium_fr/laugh1.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..982601e67e3c8090e3078fea82fcd7caff43daef --- /dev/null +++ b/tests/expected/medium_fr/laugh1.mp3.words.json @@ -0,0 +1,32 @@ +{ + "text": " Rires", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.0, + "end": 1.7, + "text": " Rires", + "tokens": [ + 50364, + 497, + 3145, + 50576 + ], + "temperature": 0.0, + "avg_logprob": -1.057028102874756, + "compression_ratio": 0.38461538461538464, + "no_speech_prob": 0.5899588465690613, + "confidence": 0.254, + "words": [ + { + "text": "Rires", + "start": 0.0, + "end": 1.7, + "confidence": 0.254 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/laugh2.mp3.words.json b/tests/expected/medium_fr/laugh2.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbde787e9d6c24115a59dccde034b48cdaa5a0c --- /dev/null +++ b/tests/expected/medium_fr/laugh2.mp3.words.json @@ -0,0 +1,32 @@ +{ + "text": " Hehehe", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.22, + "end": 0.64, + "text": " Hehehe", + "tokens": [ + 50364, + 634, + 23500, + 50398 + ], + "temperature": 0.0, + "avg_logprob": -1.2401897430419921, + "compression_ratio": 0.5, + "no_speech_prob": 0.3699853718280792, + "confidence": 0.173, + "words": [ + { + "text": "Hehehe", + "start": 0.22, + "end": 0.64, + "confidence": 0.173 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/punctuations.mp3.words.json b/tests/expected/medium_fr/punctuations.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..ea6d774cf345132b175fedfe5a717c4cd27cc3aa --- /dev/null +++ b/tests/expected/medium_fr/punctuations.mp3.words.json @@ -0,0 +1,68 @@ +{ + "text": " Dis-moi, est-ce que l'avion vole ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.38, + "end": 2.76, + "text": " Dis-moi, est-ce que l'avion vole ?", + "tokens": [ + 50364, + 4208, + 12, + 29292, + 11, + 871, + 12, + 384, + 631, + 287, + 6, + 706, + 313, + 49877, + 2506, + 50496 + ], + "temperature": 0.0, + "avg_logprob": -0.26327380012063417, + "compression_ratio": 0.8095238095238095, + "no_speech_prob": 0.03882359713315964, + "confidence": 0.928, + "words": [ + { + "text": "Dis-moi,", + "start": 0.38, + "end": 1.1, + "confidence": 0.809 + }, + { + "text": "est-ce", + "start": 1.28, + "end": 1.5, + "confidence": 0.968 + }, + { + "text": "que", + "start": 1.5, + "end": 1.66, + "confidence": 0.978 + }, + { + "text": "l'avion", + "start": 1.66, + "end": 2.04, + "confidence": 0.993 + }, + { + "text": "vole ?", + "start": 2.04, + "end": 2.76, + "confidence": 0.898 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/radio_short.mp3.words.json b/tests/expected/medium_fr/radio_short.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..44dd933b03beec4ddff2fb3dcdf5e15abf6dec1e --- /dev/null +++ b/tests/expected/medium_fr/radio_short.mp3.words.json @@ -0,0 +1,1642 @@ +{ + "text": " Le plus important au poker ce ne sont pas les cartes, c'est ce que vous en faites. Winamax, la référence du poker en ligne. Bonsoir à toutes et tous, vous êtes sur BFM TV, nous sommes en direct, c'est bien sûr BFM story avec tout ce qui fait l'actualité. Durant 60 minutes ce sont des gros plans, des analyses, des réactions que nous vous proposons. Comment Eric Verth peut-il encore soutenir la réforme des retraites alors qu'il est englué dans sa propre affaire, l'affaire Verth-Bettancourt ? 
Question posée par les leaders de la CFDT et la CGT. Réponse de Nicolas Sarkozy, Eric Verth portera le débat sur les retraites, on en parle dans BFM story avec le numéro de la CFDT. Et puis il y a une bataille qui a démarré, celle entre Marine Le Pen et Bruno Gognich, la bataille de la succession de Jean-Marie Le Pen à la tête du Front National. La tournée de campagne de Marine Le Pen commence aujourd'hui dans le Var, Marine Le Pen sera en direct dans BFM story. Restez avec nous Marine Le Pen dans moins de 3 minutes, à tout de suite. ...", + "segments": [ + { + "id": 0, + "seek": 3000, + "start": 30.88, + "end": 34.26, + "text": " Le plus important au poker ce ne sont pas les cartes, c'est ce que vous en faites.", + "tokens": [ + 50364, + 1456, + 1804, + 1021, + 1609, + 36863, + 1769, + 408, + 4900, + 1736, + 1512, + 5467, + 279, + 11, + 269, + 6, + 377, + 1769, + 631, + 2630, + 465, + 29902, + 13, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.19321525431124964, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5535648465156555, + "confidence": 0.92, + "words": [ + { + "text": "Le", + "start": 30.88, + "end": 31.02, + "confidence": 0.534 + }, + { + "text": "plus", + "start": 31.02, + "end": 31.18, + "confidence": 0.99 + }, + { + "text": "important", + "start": 31.18, + "end": 31.5, + "confidence": 0.993 + }, + { + "text": "au", + "start": 31.5, + "end": 31.62, + "confidence": 0.946 + }, + { + "text": "poker", + "start": 31.62, + "end": 31.84, + "confidence": 0.992 + }, + { + "text": "ce", + "start": 31.84, + "end": 32.0, + "confidence": 0.583 + }, + { + "text": "ne", + "start": 32.0, + "end": 32.06, + "confidence": 0.961 + }, + { + "text": "sont", + "start": 32.06, + "end": 32.16, + "confidence": 0.991 + }, + { + "text": "pas", + "start": 32.16, + "end": 32.3, + "confidence": 0.991 + }, + { + "text": "les", + "start": 32.3, + "end": 32.46, + "confidence": 0.969 + }, + { + "text": "cartes,", + "start": 32.46, + "end": 33.26, + "confidence": 
0.996 + }, + { + "text": "c'est", + "start": 33.48, + "end": 33.62, + "confidence": 0.95 + }, + { + "text": "ce", + "start": 33.62, + "end": 33.66, + "confidence": 0.99 + }, + { + "text": "que", + "start": 33.66, + "end": 33.76, + "confidence": 0.991 + }, + { + "text": "vous", + "start": 33.76, + "end": 33.9, + "confidence": 0.991 + }, + { + "text": "en", + "start": 33.9, + "end": 34.06, + "confidence": 0.982 + }, + { + "text": "faites.", + "start": 34.06, + "end": 34.26, + "confidence": 0.893 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 36.26, + "end": 38.74, + "text": " Winamax, la référence du poker en ligne.", + "tokens": [ + 50664, + 10427, + 2404, + 87, + 11, + 635, + 30170, + 41635, + 1581, + 36863, + 465, + 34207, + 13, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.19321525431124964, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5535648465156555, + "confidence": 0.967, + "words": [ + { + "text": "Winamax,", + "start": 36.26, + "end": 37.04, + "confidence": 0.905 + }, + { + "text": "la", + "start": 37.26, + "end": 37.36, + "confidence": 0.988 + }, + { + "text": "référence", + "start": 37.36, + "end": 37.78, + "confidence": 0.998 + }, + { + "text": "du", + "start": 37.78, + "end": 37.96, + "confidence": 0.992 + }, + { + "text": "poker", + "start": 37.96, + "end": 38.22, + "confidence": 0.998 + }, + { + "text": "en", + "start": 38.22, + "end": 38.44, + "confidence": 0.993 + }, + { + "text": "ligne.", + "start": 38.44, + "end": 38.74, + "confidence": 0.993 + } + ] + }, + { + "id": 2, + "seek": 3000, + "start": 44.9, + "end": 51.38, + "text": " Bonsoir à toutes et tous, vous êtes sur BFM TV, nous sommes en direct, c'est bien sûr BFM story avec tout ce qui fait l'actualité.", + "tokens": [ + 51114, + 7368, + 539, + 347, + 1531, + 14437, + 1030, + 8317, + 11, + 2630, + 18935, + 1022, + 363, + 37, + 44, + 3558, + 11, + 4666, + 25232, + 465, + 2047, + 11, + 269, + 6, + 377, + 3610, + 18143, + 363, + 37, + 44, + 1657, + 4163, + 
3486, + 1769, + 1956, + 3887, + 287, + 6, + 578, + 901, + 5066, + 13, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.19321525431124964, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5535648465156555, + "confidence": 0.907, + "words": [ + { + "text": "Bonsoir", + "start": 44.9, + "end": 45.42, + "confidence": 0.955 + }, + { + "text": "à", + "start": 45.42, + "end": 45.84, + "confidence": 0.542 + }, + { + "text": "toutes", + "start": 45.84, + "end": 46.06, + "confidence": 0.916 + }, + { + "text": "et", + "start": 46.06, + "end": 46.26, + "confidence": 0.988 + }, + { + "text": "tous,", + "start": 46.26, + "end": 46.5, + "confidence": 0.981 + }, + { + "text": "vous", + "start": 46.6, + "end": 46.74, + "confidence": 0.97 + }, + { + "text": "êtes", + "start": 46.74, + "end": 46.88, + "confidence": 0.995 + }, + { + "text": "sur", + "start": 46.88, + "end": 47.1, + "confidence": 0.989 + }, + { + "text": "BFM", + "start": 47.1, + "end": 47.52, + "confidence": 0.987 + }, + { + "text": "TV,", + "start": 47.52, + "end": 47.72, + "confidence": 0.853 + }, + { + "text": "nous", + "start": 47.84, + "end": 47.92, + "confidence": 0.83 + }, + { + "text": "sommes", + "start": 47.92, + "end": 48.14, + "confidence": 0.988 + }, + { + "text": "en", + "start": 48.14, + "end": 48.28, + "confidence": 0.987 + }, + { + "text": "direct,", + "start": 48.28, + "end": 48.52, + "confidence": 0.998 + }, + { + "text": "c'est", + "start": 48.7, + "end": 48.76, + "confidence": 0.939 + }, + { + "text": "bien", + "start": 48.76, + "end": 48.98, + "confidence": 0.971 + }, + { + "text": "sûr", + "start": 48.98, + "end": 49.22, + "confidence": 0.906 + }, + { + "text": "BFM", + "start": 49.22, + "end": 49.82, + "confidence": 0.949 + }, + { + "text": "story", + "start": 49.82, + "end": 50.04, + "confidence": 0.356 + }, + { + "text": "avec", + "start": 50.04, + "end": 50.26, + "confidence": 0.551 + }, + { + "text": "tout", + "start": 50.26, + "end": 50.42, + "confidence": 0.931 + }, 
+ { + "text": "ce", + "start": 50.42, + "end": 50.52, + "confidence": 0.995 + }, + { + "text": "qui", + "start": 50.52, + "end": 50.58, + "confidence": 0.952 + }, + { + "text": "fait", + "start": 50.58, + "end": 50.72, + "confidence": 0.961 + }, + { + "text": "l'actualité.", + "start": 50.72, + "end": 51.38, + "confidence": 0.994 + } + ] + }, + { + "id": 3, + "seek": 3000, + "start": 51.96, + "end": 56.22, + "text": " Durant 60 minutes ce sont des gros plans, des analyses, des réactions que nous vous proposons.", + "tokens": [ + 51414, + 13710, + 394, + 4060, + 2077, + 1769, + 4900, + 730, + 18638, + 5482, + 11, + 730, + 37560, + 11, + 730, + 3960, + 12299, + 631, + 4666, + 2630, + 7532, + 892, + 13, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.19321525431124964, + "compression_ratio": 1.5084745762711864, + "no_speech_prob": 0.5535648465156555, + "confidence": 0.947, + "words": [ + { + "text": "Durant", + "start": 51.96, + "end": 52.32, + "confidence": 0.935 + }, + { + "text": "60", + "start": 52.32, + "end": 52.76, + "confidence": 0.922 + }, + { + "text": "minutes", + "start": 52.76, + "end": 53.08, + "confidence": 0.912 + }, + { + "text": "ce", + "start": 53.08, + "end": 53.28, + "confidence": 0.748 + }, + { + "text": "sont", + "start": 53.28, + "end": 53.62, + "confidence": 0.979 + }, + { + "text": "des", + "start": 53.62, + "end": 53.84, + "confidence": 0.99 + }, + { + "text": "gros", + "start": 53.84, + "end": 54.06, + "confidence": 0.969 + }, + { + "text": "plans,", + "start": 54.06, + "end": 54.2, + "confidence": 0.958 + }, + { + "text": "des", + "start": 54.32, + "end": 54.44, + "confidence": 0.986 + }, + { + "text": "analyses,", + "start": 54.44, + "end": 54.68, + "confidence": 0.914 + }, + { + "text": "des", + "start": 54.78, + "end": 54.86, + "confidence": 0.995 + }, + { + "text": "réactions", + "start": 54.86, + "end": 55.22, + "confidence": 0.996 + }, + { + "text": "que", + "start": 55.22, + "end": 55.4, + "confidence": 0.881 + }, + { + 
"text": "nous", + "start": 55.4, + "end": 55.52, + "confidence": 0.947 + }, + { + "text": "vous", + "start": 55.52, + "end": 55.78, + "confidence": 0.99 + }, + { + "text": "proposons.", + "start": 55.78, + "end": 56.22, + "confidence": 0.991 + } + ] + }, + { + "id": 4, + "seek": 5600, + "start": 56.66, + "end": 64.23, + "text": " Comment Eric Verth peut-il encore soutenir la réforme des retraites alors qu'il est englué dans sa propre affaire, l'affaire Verth-Bettancourt ?", + "tokens": [ + 50364, + 16328, + 9336, + 4281, + 392, + 5977, + 12, + 388, + 10122, + 29350, + 268, + 347, + 635, + 3960, + 44562, + 730, + 49356, + 3324, + 11246, + 421, + 6, + 388, + 871, + 1741, + 2781, + 526, + 2680, + 601, + 35221, + 2096, + 9020, + 11, + 287, + 6, + 2518, + 9020, + 4281, + 392, + 12, + 33, + 3093, + 4463, + 33403, + 2506, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.13355242821478075, + "compression_ratio": 1.573667711598746, + "no_speech_prob": 0.4252333343029022, + "confidence": 0.854, + "words": [ + { + "text": "Comment", + "start": 56.66, + "end": 56.96, + "confidence": 0.944 + }, + { + "text": "Eric", + "start": 56.96, + "end": 57.2, + "confidence": 0.877 + }, + { + "text": "Verth", + "start": 57.2, + "end": 57.36, + "confidence": 0.369 + }, + { + "text": "peut-il", + "start": 57.36, + "end": 57.8, + "confidence": 0.947 + }, + { + "text": "encore", + "start": 57.8, + "end": 58.22, + "confidence": 0.954 + }, + { + "text": "soutenir", + "start": 58.22, + "end": 58.62, + "confidence": 0.997 + }, + { + "text": "la", + "start": 58.62, + "end": 58.76, + "confidence": 0.977 + }, + { + "text": "réforme", + "start": 58.76, + "end": 59.2, + "confidence": 0.996 + }, + { + "text": "des", + "start": 59.2, + "end": 59.42, + "confidence": 0.992 + }, + { + "text": "retraites", + "start": 59.42, + "end": 59.76, + "confidence": 0.99 + }, + { + "text": "alors", + "start": 59.76, + "end": 59.98, + "confidence": 0.492 + }, + { + "text": "qu'il", + "start": 59.98, + "end": 
60.74, + "confidence": 0.959 + }, + { + "text": "est", + "start": 60.74, + "end": 60.9, + "confidence": 0.973 + }, + { + "text": "englué", + "start": 60.9, + "end": 61.7, + "confidence": 0.945 + }, + { + "text": "dans", + "start": 61.7, + "end": 61.96, + "confidence": 0.961 + }, + { + "text": "sa", + "start": 61.96, + "end": 62.44, + "confidence": 0.848 + }, + { + "text": "propre", + "start": 62.44, + "end": 62.68, + "confidence": 0.992 + }, + { + "text": "affaire,", + "start": 62.68, + "end": 62.94, + "confidence": 0.993 + }, + { + "text": "l'affaire", + "start": 63.02, + "end": 63.3, + "confidence": 0.909 + }, + { + "text": "Verth-Bettancourt ?", + "start": 63.3, + "end": 64.23, + "confidence": 0.711 + } + ] + }, + { + "id": 5, + "seek": 5600, + "start": 64.23, + "end": 67.18, + "text": " Question posée par les leaders de la CFDT et la CGT.", + "tokens": [ + 50764, + 14464, + 1366, + 3856, + 971, + 1512, + 3523, + 368, + 635, + 21792, + 35, + 51, + 1030, + 635, + 38007, + 51, + 13, + 50914 + ], + "temperature": 0.0, + "avg_logprob": -0.13355242821478075, + "compression_ratio": 1.573667711598746, + "no_speech_prob": 0.4252333343029022, + "confidence": 0.895, + "words": [ + { + "text": "Question", + "start": 64.23, + "end": 64.34, + "confidence": 0.63 + }, + { + "text": "posée", + "start": 64.34, + "end": 64.74, + "confidence": 0.977 + }, + { + "text": "par", + "start": 64.74, + "end": 64.96, + "confidence": 0.988 + }, + { + "text": "les", + "start": 64.96, + "end": 65.12, + "confidence": 0.965 + }, + { + "text": "leaders", + "start": 65.12, + "end": 65.66, + "confidence": 0.977 + }, + { + "text": "de", + "start": 65.66, + "end": 65.92, + "confidence": 0.986 + }, + { + "text": "la", + "start": 65.92, + "end": 66.1, + "confidence": 0.967 + }, + { + "text": "CFDT", + "start": 66.1, + "end": 66.52, + "confidence": 0.994 + }, + { + "text": "et", + "start": 66.52, + "end": 66.6, + "confidence": 0.606 + }, + { + "text": "la", + "start": 66.6, + "end": 66.74, + 
"confidence": 0.609 + }, + { + "text": "CGT.", + "start": 66.74, + "end": 67.18, + "confidence": 0.987 + } + ] + }, + { + "id": 6, + "seek": 5600, + "start": 67.5, + "end": 76.38, + "text": " Réponse de Nicolas Sarkozy, Eric Verth portera le débat sur les retraites, on en parle dans BFM story avec le numéro de la CFDT.", + "tokens": [ + 50914, + 41587, + 3739, + 368, + 38268, + 318, + 809, + 78, + 1229, + 11, + 9336, + 4281, + 392, + 1515, + 23833, + 476, + 2795, + 11980, + 1022, + 1512, + 49356, + 3324, + 11, + 322, + 465, + 18508, + 2680, + 363, + 37, + 44, + 1657, + 4163, + 476, + 49525, + 368, + 635, + 21792, + 35, + 51, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.13355242821478075, + "compression_ratio": 1.573667711598746, + "no_speech_prob": 0.4252333343029022, + "confidence": 0.968, + "words": [ + { + "text": "Réponse", + "start": 67.5, + "end": 67.96, + "confidence": 0.947 + }, + { + "text": "de", + "start": 67.96, + "end": 68.14, + "confidence": 0.962 + }, + { + "text": "Nicolas", + "start": 68.14, + "end": 68.38, + "confidence": 0.931 + }, + { + "text": "Sarkozy,", + "start": 68.38, + "end": 68.88, + "confidence": 0.987 + }, + { + "text": "Eric", + "start": 68.98, + "end": 69.24, + "confidence": 0.962 + }, + { + "text": "Verth", + "start": 69.24, + "end": 69.84, + "confidence": 0.986 + }, + { + "text": "portera", + "start": 69.84, + "end": 70.44, + "confidence": 0.966 + }, + { + "text": "le", + "start": 70.44, + "end": 71.06, + "confidence": 0.989 + }, + { + "text": "débat", + "start": 71.06, + "end": 71.46, + "confidence": 0.996 + }, + { + "text": "sur", + "start": 71.46, + "end": 71.7, + "confidence": 0.988 + }, + { + "text": "les", + "start": 71.7, + "end": 71.88, + "confidence": 0.997 + }, + { + "text": "retraites,", + "start": 71.88, + "end": 72.26, + "confidence": 0.997 + }, + { + "text": "on", + "start": 72.36, + "end": 72.5, + "confidence": 0.865 + }, + { + "text": "en", + "start": 72.5, + "end": 72.68, + "confidence": 0.951 + }, 
+ { + "text": "parle", + "start": 72.68, + "end": 73.1, + "confidence": 0.996 + }, + { + "text": "dans", + "start": 73.1, + "end": 73.56, + "confidence": 0.981 + }, + { + "text": "BFM", + "start": 73.56, + "end": 74.46, + "confidence": 0.991 + }, + { + "text": "story", + "start": 74.46, + "end": 74.76, + "confidence": 0.761 + }, + { + "text": "avec", + "start": 74.76, + "end": 75.12, + "confidence": 0.845 + }, + { + "text": "le", + "start": 75.12, + "end": 75.32, + "confidence": 0.982 + }, + { + "text": "numéro", + "start": 75.32, + "end": 75.54, + "confidence": 0.997 + }, + { + "text": "de", + "start": 75.54, + "end": 75.76, + "confidence": 0.996 + }, + { + "text": "la", + "start": 75.76, + "end": 75.9, + "confidence": 0.987 + }, + { + "text": "CFDT.", + "start": 75.9, + "end": 76.38, + "confidence": 0.998 + } + ] + }, + { + "id": 7, + "seek": 5600, + "start": 76.8, + "end": 83.04, + "text": " Et puis il y a une bataille qui a démarré, celle entre Marine Le Pen et Bruno Gognich, la bataille de la succession de Jean-Marie Le Pen à la tête du Front National.", + "tokens": [ + 51364, + 3790, + 9093, + 1930, + 288, + 257, + 2251, + 272, + 3274, + 3409, + 1956, + 257, + 22761, + 2284, + 526, + 11, + 25722, + 3962, + 20415, + 1456, + 10571, + 1030, + 23046, + 460, + 2912, + 480, + 11, + 635, + 272, + 3274, + 3409, + 368, + 635, + 36624, + 368, + 13854, + 12, + 16639, + 414, + 1456, + 10571, + 1531, + 635, + 24661, + 1581, + 17348, + 4862, + 13, + 51714 + ], + "temperature": 0.0, + "avg_logprob": -0.13355242821478075, + "compression_ratio": 1.573667711598746, + "no_speech_prob": 0.4252333343029022, + "confidence": 0.871, + "words": [ + { + "text": "Et", + "start": 76.8, + "end": 76.96, + "confidence": 0.883 + }, + { + "text": "puis", + "start": 76.96, + "end": 77.06, + "confidence": 0.952 + }, + { + "text": "il", + "start": 77.06, + "end": 77.18, + "confidence": 0.792 + }, + { + "text": "y", + "start": 77.18, + "end": 77.2, + "confidence": 0.995 + }, + { + "text": "a", + 
"start": 77.2, + "end": 77.22, + "confidence": 0.986 + }, + { + "text": "une", + "start": 77.22, + "end": 77.28, + "confidence": 0.995 + }, + { + "text": "bataille", + "start": 77.28, + "end": 77.56, + "confidence": 0.996 + }, + { + "text": "qui", + "start": 77.56, + "end": 77.72, + "confidence": 0.997 + }, + { + "text": "a", + "start": 77.72, + "end": 77.76, + "confidence": 0.985 + }, + { + "text": "démarré,", + "start": 77.76, + "end": 78.16, + "confidence": 0.988 + }, + { + "text": "celle", + "start": 78.24, + "end": 78.4, + "confidence": 0.997 + }, + { + "text": "entre", + "start": 78.4, + "end": 78.64, + "confidence": 0.975 + }, + { + "text": "Marine", + "start": 78.64, + "end": 78.94, + "confidence": 0.987 + }, + { + "text": "Le", + "start": 78.94, + "end": 79.12, + "confidence": 0.986 + }, + { + "text": "Pen", + "start": 79.12, + "end": 79.18, + "confidence": 0.986 + }, + { + "text": "et", + "start": 79.18, + "end": 79.34, + "confidence": 0.997 + }, + { + "text": "Bruno", + "start": 79.34, + "end": 79.54, + "confidence": 0.986 + }, + { + "text": "Gognich,", + "start": 79.54, + "end": 80.02, + "confidence": 0.239 + }, + { + "text": "la", + "start": 80.2, + "end": 80.32, + "confidence": 0.71 + }, + { + "text": "bataille", + "start": 80.32, + "end": 80.58, + "confidence": 0.998 + }, + { + "text": "de", + "start": 80.58, + "end": 80.72, + "confidence": 0.976 + }, + { + "text": "la", + "start": 80.72, + "end": 80.84, + "confidence": 0.987 + }, + { + "text": "succession", + "start": 80.84, + "end": 81.22, + "confidence": 0.982 + }, + { + "text": "de", + "start": 81.22, + "end": 81.44, + "confidence": 0.985 + }, + { + "text": "Jean-Marie", + "start": 81.44, + "end": 81.72, + "confidence": 0.95 + }, + { + "text": "Le", + "start": 81.72, + "end": 81.9, + "confidence": 0.996 + }, + { + "text": "Pen", + "start": 81.9, + "end": 82.0, + "confidence": 0.999 + }, + { + "text": "à", + "start": 82.0, + "end": 82.16, + "confidence": 0.977 + }, + { + "text": "la", + "start": 
82.16, + "end": 82.22, + "confidence": 0.995 + }, + { + "text": "tête", + "start": 82.22, + "end": 82.32, + "confidence": 0.926 + }, + { + "text": "du", + "start": 82.32, + "end": 82.46, + "confidence": 0.997 + }, + { + "text": "Front", + "start": 82.46, + "end": 82.66, + "confidence": 0.777 + }, + { + "text": "National.", + "start": 82.66, + "end": 83.04, + "confidence": 0.822 + } + ] + }, + { + "id": 8, + "seek": 8300, + "start": 83.34, + "end": 88.88, + "text": " La tournée de campagne de Marine Le Pen commence aujourd'hui dans le Var, Marine Le Pen sera en direct dans BFM story.", + "tokens": [ + 50364, + 2369, + 3512, + 77, + 3856, + 368, + 2255, + 13887, + 368, + 20415, + 1456, + 10571, + 18137, + 14023, + 6, + 10556, + 2680, + 476, + 14662, + 11, + 20415, + 1456, + 10571, + 15021, + 465, + 2047, + 2680, + 363, + 37, + 44, + 1657, + 13, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.1127048058943315, + "compression_ratio": 1.3591549295774648, + "no_speech_prob": 0.4064846634864807, + "confidence": 0.954, + "words": [ + { + "text": "La", + "start": 83.34, + "end": 83.68, + "confidence": 0.921 + }, + { + "text": "tournée", + "start": 83.68, + "end": 84.16, + "confidence": 0.994 + }, + { + "text": "de", + "start": 84.16, + "end": 84.48, + "confidence": 0.936 + }, + { + "text": "campagne", + "start": 84.48, + "end": 84.8, + "confidence": 0.981 + }, + { + "text": "de", + "start": 84.8, + "end": 84.98, + "confidence": 0.971 + }, + { + "text": "Marine", + "start": 84.98, + "end": 85.14, + "confidence": 0.997 + }, + { + "text": "Le", + "start": 85.14, + "end": 85.32, + "confidence": 0.997 + }, + { + "text": "Pen", + "start": 85.32, + "end": 85.44, + "confidence": 0.999 + }, + { + "text": "commence", + "start": 85.44, + "end": 85.8, + "confidence": 0.971 + }, + { + "text": "aujourd'hui", + "start": 85.8, + "end": 86.14, + "confidence": 0.988 + }, + { + "text": "dans", + "start": 86.14, + "end": 86.28, + "confidence": 0.979 + }, + { + "text": "le", + "start": 
86.28, + "end": 86.46, + "confidence": 0.923 + }, + { + "text": "Var,", + "start": 86.46, + "end": 86.64, + "confidence": 0.533 + }, + { + "text": "Marine", + "start": 86.74, + "end": 86.96, + "confidence": 0.992 + }, + { + "text": "Le", + "start": 86.96, + "end": 87.12, + "confidence": 0.992 + }, + { + "text": "Pen", + "start": 87.12, + "end": 87.22, + "confidence": 0.999 + }, + { + "text": "sera", + "start": 87.22, + "end": 87.48, + "confidence": 0.989 + }, + { + "text": "en", + "start": 87.48, + "end": 87.76, + "confidence": 0.989 + }, + { + "text": "direct", + "start": 87.76, + "end": 88.04, + "confidence": 0.997 + }, + { + "text": "dans", + "start": 88.04, + "end": 88.34, + "confidence": 0.925 + }, + { + "text": "BFM", + "start": 88.34, + "end": 88.68, + "confidence": 0.996 + }, + { + "text": "story.", + "start": 88.68, + "end": 88.88, + "confidence": 0.831 + } + ] + }, + { + "id": 9, + "seek": 8300, + "start": 89.02, + "end": 92.28, + "text": " Restez avec nous Marine Le Pen dans moins de 3 minutes, à tout de suite.", + "tokens": [ + 50664, + 13094, + 4371, + 4163, + 4666, + 20415, + 1456, + 10571, + 2680, + 13099, + 368, + 805, + 2077, + 11, + 1531, + 3486, + 368, + 14205, + 13, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.1127048058943315, + "compression_ratio": 1.3591549295774648, + "no_speech_prob": 0.4064846634864807, + "confidence": 0.936, + "words": [ + { + "text": "Restez", + "start": 89.02, + "end": 89.4, + "confidence": 0.967 + }, + { + "text": "avec", + "start": 89.4, + "end": 89.7, + "confidence": 0.997 + }, + { + "text": "nous", + "start": 89.7, + "end": 89.94, + "confidence": 0.956 + }, + { + "text": "Marine", + "start": 89.94, + "end": 90.24, + "confidence": 0.912 + }, + { + "text": "Le", + "start": 90.24, + "end": 90.52, + "confidence": 0.997 + }, + { + "text": "Pen", + "start": 90.52, + "end": 90.68, + "confidence": 0.999 + }, + { + "text": "dans", + "start": 90.68, + "end": 90.98, + "confidence": 0.843 + }, + { + "text": "moins", + 
"start": 90.98, + "end": 91.2, + "confidence": 0.992 + }, + { + "text": "de", + "start": 91.2, + "end": 91.34, + "confidence": 0.991 + }, + { + "text": "3", + "start": 91.34, + "end": 91.52, + "confidence": 0.595 + }, + { + "text": "minutes,", + "start": 91.52, + "end": 91.8, + "confidence": 0.985 + }, + { + "text": "à", + "start": 91.82, + "end": 91.98, + "confidence": 0.962 + }, + { + "text": "tout", + "start": 91.98, + "end": 92.1, + "confidence": 0.917 + }, + { + "text": "de", + "start": 92.1, + "end": 92.14, + "confidence": 0.999 + }, + { + "text": "suite.", + "start": 92.14, + "end": 92.28, + "confidence": 0.999 + } + ] + }, + { + "id": 10, + "seek": 9200, + "start": 92.28, + "end": 93.08, + "text": " ...", + "tokens": [ + 50364, + 1097, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.6883202791213989, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.8045242428779602, + "confidence": 0.153, + "words": [ + { + "text": "...", + "start": 92.28, + "end": 93.08, + "confidence": 0.153 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/medium_fr/smartphone.mp3.words.json b/tests/expected/medium_fr/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..a51a598ad65798c6c7f09c9ee8eac752e218e74e --- /dev/null +++ b/tests/expected/medium_fr/smartphone.mp3.words.json @@ -0,0 +1,4899 @@ +{ + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions, mais la manière dont elles interagissent entre elles. Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces. L'écran tactile a été beaucoup très souvent mentionné. Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes. 
Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible. Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but. Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité. Mais ça, ça soulève une autre interrogation. Est-ce que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit ? Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone ? Il n'y a pas d'équivalent en fait. Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant. Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendant de cet objet, d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet. Donc à objet inédit, rapport inédit. Et ce rapport, si j'en crois à Nicolas, serait caractérisé par un mélange de dépendance et de rejet. Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment. Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais la dépendance n'était pas du même ordre. Donc le rejet non plus n'était pas du même ordre. On peut adorer sa bagnole, en avoir besoin pour plein de choses. Le soir, quand on va se coucher, on la laisse. On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes. On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. 
Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui, continuellement avec son smartphone dans la main, comme si c'était une sorte de pacemaker externe, comme si le lâcher allait entraîner sa mort immédiate. Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi. Donc, rapport inédit, d'accord. Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais ? Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux ? Les économistes parlent de dépendance du sentier. C'est l'idée qu'on met sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.4, + "end": 3.66, + "text": " C'est évident ce que dit Nicolas, mais je ne me l'étais jamais formulé comme ça.", + "tokens": [ + 50364, + 383, + 6, + 377, + 20090, + 1078, + 1769, + 631, + 6176, + 38268, + 11, + 2420, + 1506, + 408, + 385, + 287, + 6, + 22824, + 14540, + 49990, + 526, + 5173, + 2788, + 13, + 50539 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.935, + "words": [ + { + "text": "C'est", + "start": 0.4, + "end": 0.64, + "confidence": 0.961 + }, + { + "text": "évident", + "start": 0.64, + "end": 0.9, + "confidence": 0.984 + }, + { + "text": "ce", + "start": 0.9, + "end": 1.0, + "confidence": 0.663 + }, + { + "text": "que", + "start": 1.0, + "end": 1.08, + "confidence": 0.989 + }, + { + "text": "dit", + "start": 1.08, + "end": 1.2, + "confidence": 0.994 + }, + { + "text": "Nicolas,", + "start": 1.2, + "end": 1.48, + "confidence": 0.91 + }, + { + "text": "mais", + "start": 1.7, + "end": 2.04, + "confidence": 0.979 + }, + { + "text": "je", + "start": 2.04, + "end": 2.26, + "confidence": 0.981 + }, + { + "text": "ne", + "start": 2.26, 
+ "end": 2.34, + "confidence": 0.837 + }, + { + "text": "me", + "start": 2.34, + "end": 2.36, + "confidence": 0.821 + }, + { + "text": "l'étais", + "start": 2.36, + "end": 2.58, + "confidence": 0.971 + }, + { + "text": "jamais", + "start": 2.58, + "end": 2.88, + "confidence": 0.989 + }, + { + "text": "formulé", + "start": 2.88, + "end": 3.26, + "confidence": 0.908 + }, + { + "text": "comme", + "start": 3.26, + "end": 3.44, + "confidence": 0.993 + }, + { + "text": "ça.", + "start": 3.44, + "end": 3.66, + "confidence": 0.975 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 4.16, + "end": 7.94, + "text": " Ce qui fait la force du smartphone, c'est pas seulement l'accumulation des fonctions,", + "tokens": [ + 50549, + 8257, + 1956, + 3887, + 635, + 3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 287, + 6, + 8476, + 449, + 2776, + 730, + 17290, + 3916, + 11, + 50756 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.93, + "words": [ + { + "text": "Ce", + "start": 4.16, + "end": 4.28, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 4.28, + "end": 4.36, + "confidence": 0.958 + }, + { + "text": "fait", + "start": 4.36, + "end": 4.5, + "confidence": 0.567 + }, + { + "text": "la", + "start": 4.5, + "end": 4.76, + "confidence": 0.972 + }, + { + "text": "force", + "start": 4.76, + "end": 5.02, + "confidence": 0.999 + }, + { + "text": "du", + "start": 5.02, + "end": 5.22, + "confidence": 0.996 + }, + { + "text": "smartphone,", + "start": 5.22, + "end": 5.7, + "confidence": 0.912 + }, + { + "text": "c'est", + "start": 6.04, + "end": 6.16, + "confidence": 0.879 + }, + { + "text": "pas", + "start": 6.16, + "end": 6.26, + "confidence": 0.991 + }, + { + "text": "seulement", + "start": 6.26, + "end": 6.54, + "confidence": 0.999 + }, + { + "text": "l'accumulation", + "start": 6.54, + "end": 7.4, + "confidence": 0.958 + }, + { + "text": 
"des", + "start": 7.4, + "end": 7.58, + "confidence": 0.983 + }, + { + "text": "fonctions,", + "start": 7.58, + "end": 7.94, + "confidence": 0.987 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 8.32, + "end": 10.88, + "text": " mais la manière dont elles interagissent entre elles.", + "tokens": [ + 50756, + 2420, + 635, + 22267, + 9400, + 23576, + 728, + 559, + 25450, + 3962, + 23576, + 13, + 50906 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.977, + "words": [ + { + "text": "mais", + "start": 8.32, + "end": 8.48, + "confidence": 0.992 + }, + { + "text": "la", + "start": 8.48, + "end": 8.7, + "confidence": 0.995 + }, + { + "text": "manière", + "start": 8.7, + "end": 8.94, + "confidence": 0.999 + }, + { + "text": "dont", + "start": 8.94, + "end": 9.08, + "confidence": 0.978 + }, + { + "text": "elles", + "start": 9.08, + "end": 9.48, + "confidence": 0.967 + }, + { + "text": "interagissent", + "start": 9.48, + "end": 10.38, + "confidence": 0.964 + }, + { + "text": "entre", + "start": 10.38, + "end": 10.7, + "confidence": 0.955 + }, + { + "text": "elles.", + "start": 10.7, + "end": 10.88, + "confidence": 0.989 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 10.96, + "end": 13.0, + "text": " Ce qui dit d'ailleurs sur la photo, c'est hyper convaincant.", + "tokens": [ + 50906, + 8257, + 1956, + 6176, + 274, + 6, + 19400, + 1022, + 635, + 5052, + 11, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13, + 51006 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.906, + "words": [ + { + "text": "Ce", + "start": 10.96, + "end": 11.16, + "confidence": 0.608 + }, + { + "text": "qui", + "start": 11.16, + "end": 11.26, + "confidence": 0.769 + }, + { + "text": "dit", + "start": 11.26, + "end": 11.38, + "confidence": 0.983 + }, + { 
+ "text": "d'ailleurs", + "start": 11.38, + "end": 11.58, + "confidence": 0.985 + }, + { + "text": "sur", + "start": 11.58, + "end": 11.72, + "confidence": 0.48 + }, + { + "text": "la", + "start": 11.72, + "end": 11.82, + "confidence": 0.984 + }, + { + "text": "photo,", + "start": 11.82, + "end": 12.0, + "confidence": 0.994 + }, + { + "text": "c'est", + "start": 12.14, + "end": 12.2, + "confidence": 0.997 + }, + { + "text": "hyper", + "start": 12.2, + "end": 12.48, + "confidence": 0.993 + }, + { + "text": "convaincant.", + "start": 12.48, + "end": 13.0, + "confidence": 0.982 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.38, + "end": 16.04, + "text": " Alors évidemment, il faudrait ajouter les interfaces.", + "tokens": [ + 51006, + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 13, + 51166 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.912, + "words": [ + { + "text": "Alors", + "start": 13.38, + "end": 13.58, + "confidence": 0.584 + }, + { + "text": "évidemment,", + "start": 13.58, + "end": 13.86, + "confidence": 0.832 + }, + { + "text": "il", + "start": 14.26, + "end": 14.42, + "confidence": 0.953 + }, + { + "text": "faudrait", + "start": 14.42, + "end": 14.76, + "confidence": 0.996 + }, + { + "text": "ajouter", + "start": 14.76, + "end": 15.2, + "confidence": 0.992 + }, + { + "text": "les", + "start": 15.2, + "end": 15.6, + "confidence": 0.985 + }, + { + "text": "interfaces.", + "start": 15.6, + "end": 16.04, + "confidence": 0.984 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 16.22, + "end": 19.36, + "text": " L'écran tactile a été beaucoup très souvent mentionné.", + "tokens": [ + 51166, + 441, + 6, + 9062, + 4257, + 47319, + 257, + 8862, + 8796, + 5732, + 20847, + 2152, + 15055, + 13, + 51331 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 
1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.923, + "words": [ + { + "text": "L'écran", + "start": 16.22, + "end": 16.78, + "confidence": 0.996 + }, + { + "text": "tactile", + "start": 16.78, + "end": 17.1, + "confidence": 0.986 + }, + { + "text": "a", + "start": 17.1, + "end": 17.3, + "confidence": 0.98 + }, + { + "text": "été", + "start": 17.3, + "end": 17.84, + "confidence": 0.974 + }, + { + "text": "beaucoup", + "start": 17.84, + "end": 18.28, + "confidence": 0.976 + }, + { + "text": "très", + "start": 18.28, + "end": 18.62, + "confidence": 0.447 + }, + { + "text": "souvent", + "start": 18.62, + "end": 18.9, + "confidence": 0.996 + }, + { + "text": "mentionné.", + "start": 18.9, + "end": 19.36, + "confidence": 0.978 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 20.02, + "end": 25.44, + "text": " Mais bon, il faut dire qu'il profite aussi de 20 ans pendant lesquels les ordinateurs nous ont appris à cliquer sur des icônes.", + "tokens": [ + 51331, + 6313, + 4428, + 11, + 1930, + 8487, + 1264, + 421, + 6, + 388, + 1740, + 642, + 6212, + 368, + 945, + 1567, + 17338, + 1512, + 358, + 1625, + 1512, + 4792, + 13923, + 2156, + 4666, + 6592, + 724, + 5714, + 1531, + 596, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 13, + 51631 + ], + "temperature": 0.0, + "avg_logprob": -0.2362650940749819, + "compression_ratio": 1.6238532110091743, + "no_speech_prob": 0.15368737280368805, + "confidence": 0.92, + "words": [ + { + "text": "Mais", + "start": 20.02, + "end": 20.26, + "confidence": 0.943 + }, + { + "text": "bon,", + "start": 20.26, + "end": 20.5, + "confidence": 0.666 + }, + { + "text": "il", + "start": 20.52, + "end": 20.62, + "confidence": 0.99 + }, + { + "text": "faut", + "start": 20.62, + "end": 20.7, + "confidence": 0.99 + }, + { + "text": "dire", + "start": 20.7, + "end": 20.82, + "confidence": 0.995 + }, + { + "text": "qu'il", + "start": 20.82, + "end": 21.04, + "confidence": 0.88 + }, + { + "text": "profite", + "start": 
21.04, + "end": 21.3, + "confidence": 0.995 + }, + { + "text": "aussi", + "start": 21.3, + "end": 21.7, + "confidence": 0.972 + }, + { + "text": "de", + "start": 21.7, + "end": 21.94, + "confidence": 0.97 + }, + { + "text": "20", + "start": 21.94, + "end": 22.16, + "confidence": 0.812 + }, + { + "text": "ans", + "start": 22.16, + "end": 22.3, + "confidence": 0.997 + }, + { + "text": "pendant", + "start": 22.3, + "end": 22.54, + "confidence": 0.723 + }, + { + "text": "lesquels", + "start": 22.54, + "end": 22.92, + "confidence": 0.98 + }, + { + "text": "les", + "start": 22.92, + "end": 23.14, + "confidence": 0.71 + }, + { + "text": "ordinateurs", + "start": 23.14, + "end": 23.58, + "confidence": 0.966 + }, + { + "text": "nous", + "start": 23.58, + "end": 23.74, + "confidence": 0.602 + }, + { + "text": "ont", + "start": 23.74, + "end": 23.88, + "confidence": 0.974 + }, + { + "text": "appris", + "start": 23.88, + "end": 24.12, + "confidence": 0.991 + }, + { + "text": "à", + "start": 24.12, + "end": 24.26, + "confidence": 0.828 + }, + { + "text": "cliquer", + "start": 24.26, + "end": 24.54, + "confidence": 0.989 + }, + { + "text": "sur", + "start": 24.54, + "end": 24.72, + "confidence": 0.984 + }, + { + "text": "des", + "start": 24.72, + "end": 24.92, + "confidence": 0.971 + }, + { + "text": "icônes.", + "start": 24.92, + "end": 25.44, + "confidence": 0.992 + } + ] + }, + { + "id": 7, + "seek": 2534, + "start": 25.54, + "end": 30.64, + "text": " Sauf que le smartphone ajoute le toucher, ce qui rend le contact plus direct, plus sensible.", + "tokens": [ + 50364, + 318, + 9507, + 631, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 1769, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13, + 50639 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.968, + "words": [ + { + "text": "Sauf", + "start": 25.54, + "end": 
25.82, + "confidence": 0.974 + }, + { + "text": "que", + "start": 25.82, + "end": 26.3, + "confidence": 0.996 + }, + { + "text": "le", + "start": 26.3, + "end": 26.66, + "confidence": 0.671 + }, + { + "text": "smartphone", + "start": 26.66, + "end": 27.08, + "confidence": 0.995 + }, + { + "text": "ajoute", + "start": 27.08, + "end": 27.48, + "confidence": 0.99 + }, + { + "text": "le", + "start": 27.48, + "end": 27.66, + "confidence": 0.989 + }, + { + "text": "toucher,", + "start": 27.66, + "end": 28.06, + "confidence": 0.987 + }, + { + "text": "ce", + "start": 28.14, + "end": 28.16, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 28.16, + "end": 28.3, + "confidence": 1.0 + }, + { + "text": "rend", + "start": 28.3, + "end": 28.54, + "confidence": 0.994 + }, + { + "text": "le", + "start": 28.54, + "end": 28.8, + "confidence": 0.992 + }, + { + "text": "contact", + "start": 28.8, + "end": 29.16, + "confidence": 0.999 + }, + { + "text": "plus", + "start": 29.16, + "end": 29.58, + "confidence": 0.983 + }, + { + "text": "direct,", + "start": 29.58, + "end": 30.0, + "confidence": 0.991 + }, + { + "text": "plus", + "start": 30.1, + "end": 30.24, + "confidence": 0.99 + }, + { + "text": "sensible.", + "start": 30.24, + "end": 30.64, + "confidence": 0.997 + } + ] + }, + { + "id": 8, + "seek": 2534, + "start": 31.04, + "end": 37.82, + "text": " Et puis évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté touffu de la navigation web pour aller directement au but.", + "tokens": [ + 50639, + 3790, + 9093, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193, + 476, + 18437, + 10095, + 602, + 84, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 1609, + 457, + 13, + 50989 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.893, + "words": [ + { + 
"text": "Et", + "start": 31.04, + "end": 31.24, + "confidence": 0.964 + }, + { + "text": "puis", + "start": 31.24, + "end": 31.34, + "confidence": 0.967 + }, + { + "text": "évidemment,", + "start": 31.34, + "end": 31.62, + "confidence": 0.87 + }, + { + "text": "il", + "start": 31.66, + "end": 31.72, + "confidence": 0.99 + }, + { + "text": "faudrait", + "start": 31.72, + "end": 31.94, + "confidence": 0.996 + }, + { + "text": "parler", + "start": 31.94, + "end": 32.16, + "confidence": 0.864 + }, + { + "text": "aussi", + "start": 32.16, + "end": 32.34, + "confidence": 0.971 + }, + { + "text": "des", + "start": 32.34, + "end": 32.48, + "confidence": 0.993 + }, + { + "text": "applications", + "start": 32.48, + "end": 32.92, + "confidence": 0.993 + }, + { + "text": "qui", + "start": 32.92, + "end": 33.22, + "confidence": 0.564 + }, + { + "text": "permettent", + "start": 33.22, + "end": 33.76, + "confidence": 0.99 + }, + { + "text": "de", + "start": 33.76, + "end": 33.98, + "confidence": 0.871 + }, + { + "text": "contourner", + "start": 33.98, + "end": 34.42, + "confidence": 0.953 + }, + { + "text": "le", + "start": 34.42, + "end": 34.54, + "confidence": 0.75 + }, + { + "text": "côté", + "start": 34.54, + "end": 34.78, + "confidence": 0.985 + }, + { + "text": "touffu", + "start": 34.78, + "end": 35.32, + "confidence": 0.726 + }, + { + "text": "de", + "start": 35.32, + "end": 35.7, + "confidence": 0.882 + }, + { + "text": "la", + "start": 35.7, + "end": 35.82, + "confidence": 0.991 + }, + { + "text": "navigation", + "start": 35.82, + "end": 36.3, + "confidence": 0.992 + }, + { + "text": "web", + "start": 36.3, + "end": 36.58, + "confidence": 0.847 + }, + { + "text": "pour", + "start": 36.58, + "end": 36.76, + "confidence": 0.59 + }, + { + "text": "aller", + "start": 36.76, + "end": 37.16, + "confidence": 0.981 + }, + { + "text": "directement", + "start": 37.16, + "end": 37.54, + "confidence": 0.997 + }, + { + "text": "au", + "start": 37.54, + "end": 37.7, + "confidence": 
0.969 + }, + { + "text": "but.", + "start": 37.7, + "end": 37.82, + "confidence": 0.995 + } + ] + }, + { + "id": 9, + "seek": 2534, + "start": 37.9, + "end": 46.6, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cet objet dont Nicolas dit qu'il est vraisemblablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 50989, + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 8603, + 14964, + 9400, + 38268, + 6176, + 421, + 6, + 388, + 871, + 6070, + 271, + 443, + 5199, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13, + 51439 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.973, + "words": [ + { + "text": "Bref,", + "start": 37.9, + "end": 38.24, + "confidence": 0.984 + }, + { + "text": "tout", + "start": 38.88, + "end": 39.02, + "confidence": 0.701 + }, + { + "text": "ça,", + "start": 39.02, + "end": 39.4, + "confidence": 0.995 + }, + { + "text": "ce", + "start": 39.4, + "end": 39.72, + "confidence": 0.989 + }, + { + "text": "sont", + "start": 39.72, + "end": 39.92, + "confidence": 0.999 + }, + { + "text": "les", + "start": 39.92, + "end": 40.22, + "confidence": 0.992 + }, + { + "text": "conditions", + "start": 40.22, + "end": 40.7, + "confidence": 0.995 + }, + { + "text": "qui", + "start": 40.7, + "end": 41.02, + "confidence": 0.997 + }, + { + "text": "permettent", + "start": 41.02, + "end": 41.44, + "confidence": 0.996 + }, + { + "text": "de", + "start": 41.44, + "end": 41.74, + "confidence": 0.997 + }, + { + "text": "créer", + "start": 41.74, + "end": 42.1, + "confidence": 0.999 + }, + { + "text": "cet", + "start": 42.1, + "end": 42.38, + "confidence": 0.997 + }, + { + "text": "objet", + "start": 42.38, + "end": 42.64, + "confidence": 0.994 + }, + { + "text": "dont", + "start": 42.64, + "end": 42.84, 
+ "confidence": 0.789 + }, + { + "text": "Nicolas", + "start": 42.84, + "end": 43.24, + "confidence": 0.988 + }, + { + "text": "dit", + "start": 43.24, + "end": 43.52, + "confidence": 0.986 + }, + { + "text": "qu'il", + "start": 43.52, + "end": 43.74, + "confidence": 0.982 + }, + { + "text": "est", + "start": 43.74, + "end": 43.94, + "confidence": 0.99 + }, + { + "text": "vraisemblablement", + "start": 43.94, + "end": 44.86, + "confidence": 0.99 + }, + { + "text": "inédit", + "start": 44.86, + "end": 45.44, + "confidence": 0.98 + }, + { + "text": "dans", + "start": 45.44, + "end": 45.72, + "confidence": 0.967 + }, + { + "text": "l'histoire", + "start": 45.72, + "end": 46.02, + "confidence": 0.958 + }, + { + "text": "de", + "start": 46.02, + "end": 46.14, + "confidence": 0.999 + }, + { + "text": "l'humanité.", + "start": 46.14, + "end": 46.6, + "confidence": 0.992 + } + ] + }, + { + "id": 10, + "seek": 2534, + "start": 47.02, + "end": 48.78, + "text": " Mais ça, ça soulève une autre interrogation.", + "tokens": [ + 51439, + 6313, + 2788, + 11, + 2788, + 5133, + 31397, + 2251, + 15081, + 24871, + 399, + 13, + 51539 + ], + "temperature": 0.0, + "avg_logprob": -0.10785348191220537, + "compression_ratio": 1.6254416961130742, + "no_speech_prob": 0.18929888308048248, + "confidence": 0.969, + "words": [ + { + "text": "Mais", + "start": 47.02, + "end": 47.28, + "confidence": 0.84 + }, + { + "text": "ça,", + "start": 47.28, + "end": 47.48, + "confidence": 0.942 + }, + { + "text": "ça", + "start": 47.62, + "end": 47.64, + "confidence": 0.976 + }, + { + "text": "soulève", + "start": 47.64, + "end": 47.86, + "confidence": 0.993 + }, + { + "text": "une", + "start": 47.86, + "end": 48.02, + "confidence": 0.998 + }, + { + "text": "autre", + "start": 48.02, + "end": 48.2, + "confidence": 0.999 + }, + { + "text": "interrogation.", + "start": 48.2, + "end": 48.78, + "confidence": 0.997 + } + ] + }, + { + "id": 11, + "seek": 4884, + "start": 49.36, + "end": 55.5, + "text": " Est-ce 
que le fait que cet objet soit inédit induit que notre rapport à lui est aussi un rapport inédit ?", + "tokens": [ + 50389, + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 8603, + 14964, + 12703, + 294, + 7811, + 270, + 13716, + 270, + 631, + 10349, + 18018, + 1531, + 8783, + 871, + 6212, + 517, + 18018, + 294, + 7811, + 270, + 2506, + 50689 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.986, + "words": [ + { + "text": "Est-ce", + "start": 49.36, + "end": 49.64, + "confidence": 0.978 + }, + { + "text": "que", + "start": 49.64, + "end": 49.76, + "confidence": 0.991 + }, + { + "text": "le", + "start": 49.76, + "end": 49.82, + "confidence": 0.993 + }, + { + "text": "fait", + "start": 49.82, + "end": 50.0, + "confidence": 0.999 + }, + { + "text": "que", + "start": 50.0, + "end": 50.14, + "confidence": 0.991 + }, + { + "text": "cet", + "start": 50.14, + "end": 50.32, + "confidence": 0.99 + }, + { + "text": "objet", + "start": 50.32, + "end": 50.66, + "confidence": 0.997 + }, + { + "text": "soit", + "start": 50.66, + "end": 51.12, + "confidence": 0.995 + }, + { + "text": "inédit", + "start": 51.12, + "end": 51.78, + "confidence": 0.995 + }, + { + "text": "induit", + "start": 51.78, + "end": 52.32, + "confidence": 0.955 + }, + { + "text": "que", + "start": 52.32, + "end": 52.42, + "confidence": 0.984 + }, + { + "text": "notre", + "start": 52.42, + "end": 52.78, + "confidence": 0.995 + }, + { + "text": "rapport", + "start": 52.78, + "end": 53.28, + "confidence": 0.997 + }, + { + "text": "à", + "start": 53.28, + "end": 53.46, + "confidence": 0.978 + }, + { + "text": "lui", + "start": 53.46, + "end": 53.68, + "confidence": 0.999 + }, + { + "text": "est", + "start": 53.68, + "end": 54.14, + "confidence": 0.907 + }, + { + "text": "aussi", + "start": 54.14, + "end": 54.52, + "confidence": 0.996 + }, + { + "text": "un", + "start": 54.52, + "end": 54.72, + 
"confidence": 0.994 + }, + { + "text": "rapport", + "start": 54.72, + "end": 55.0, + "confidence": 0.997 + }, + { + "text": "inédit ?", + "start": 55.0, + "end": 55.5, + "confidence": 0.996 + } + ] + }, + { + "id": 12, + "seek": 4884, + "start": 55.76, + "end": 63.4, + "text": " Je veux dire, est-ce que le rapport qu'on a au smartphone est comparable à celui qu'on entretenait à d'autres objets techniques comme la voiture ou le téléphone ?", + "tokens": [ + 50689, + 2588, + 16389, + 1264, + 11, + 871, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 13307, + 871, + 25323, + 1531, + 22829, + 421, + 6, + 266, + 3962, + 1147, + 1001, + 1531, + 274, + 6, + 16752, + 1111, + 25349, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506, + 51089 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.96, + "words": [ + { + "text": "Je", + "start": 55.76, + "end": 55.9, + "confidence": 0.904 + }, + { + "text": "veux", + "start": 55.9, + "end": 56.0, + "confidence": 0.989 + }, + { + "text": "dire,", + "start": 56.0, + "end": 56.12, + "confidence": 0.997 + }, + { + "text": "est-ce", + "start": 56.22, + "end": 56.38, + "confidence": 0.99 + }, + { + "text": "que", + "start": 56.38, + "end": 56.5, + "confidence": 0.991 + }, + { + "text": "le", + "start": 56.5, + "end": 56.66, + "confidence": 0.996 + }, + { + "text": "rapport", + "start": 56.66, + "end": 56.86, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 56.86, + "end": 57.08, + "confidence": 0.985 + }, + { + "text": "a", + "start": 57.08, + "end": 57.16, + "confidence": 0.99 + }, + { + "text": "au", + "start": 57.16, + "end": 57.28, + "confidence": 0.966 + }, + { + "text": "smartphone", + "start": 57.28, + "end": 57.6, + "confidence": 0.995 + }, + { + "text": "est", + "start": 57.6, + "end": 57.86, + "confidence": 0.91 + }, + { + "text": "comparable", + "start": 57.86, + 
"end": 58.3, + "confidence": 0.996 + }, + { + "text": "à", + "start": 58.3, + "end": 58.5, + "confidence": 0.946 + }, + { + "text": "celui", + "start": 58.5, + "end": 58.66, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 58.66, + "end": 58.96, + "confidence": 0.989 + }, + { + "text": "entretenait", + "start": 58.96, + "end": 59.36, + "confidence": 0.926 + }, + { + "text": "à", + "start": 59.36, + "end": 59.48, + "confidence": 0.951 + }, + { + "text": "d'autres", + "start": 59.48, + "end": 59.7, + "confidence": 0.997 + }, + { + "text": "objets", + "start": 59.7, + "end": 59.98, + "confidence": 0.99 + }, + { + "text": "techniques", + "start": 59.98, + "end": 60.44, + "confidence": 0.984 + }, + { + "text": "comme", + "start": 60.44, + "end": 60.96, + "confidence": 0.496 + }, + { + "text": "la", + "start": 60.96, + "end": 61.52, + "confidence": 0.987 + }, + { + "text": "voiture", + "start": 61.52, + "end": 62.08, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 62.08, + "end": 62.52, + "confidence": 0.95 + }, + { + "text": "le", + "start": 62.52, + "end": 62.74, + "confidence": 0.998 + }, + { + "text": "téléphone ?", + "start": 62.74, + "end": 63.4, + "confidence": 0.999 + } + ] + }, + { + "id": 13, + "seek": 4884, + "start": 65.36, + "end": 66.62, + "text": " Il n'y a pas d'équivalent en fait.", + "tokens": [ + 51189, + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 465, + 3887, + 13, + 51239 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.94, + "words": [ + { + "text": "Il", + "start": 65.36, + "end": 65.5, + "confidence": 0.849 + }, + { + "text": "n'y", + "start": 65.5, + "end": 65.54, + "confidence": 0.979 + }, + { + "text": "a", + "start": 65.54, + "end": 65.56, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 65.56, + "end": 65.66, + "confidence": 0.999 + }, + { + "text": 
"d'équivalent", + "start": 65.66, + "end": 66.3, + "confidence": 0.995 + }, + { + "text": "en", + "start": 66.3, + "end": 66.44, + "confidence": 0.582 + }, + { + "text": "fait.", + "start": 66.44, + "end": 66.62, + "confidence": 0.997 + } + ] + }, + { + "id": 14, + "seek": 4884, + "start": 66.88, + "end": 71.24, + "text": " Et donc cette espèce de nouveauté dans la relation à l'objet, c'est fascinant et terrifiant.", + "tokens": [ + 51239, + 3790, + 5926, + 5550, + 7089, + 30236, + 368, + 11456, + 1375, + 526, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 11, + 269, + 6, + 377, + 7184, + 259, + 394, + 1030, + 7245, + 351, + 5798, + 13, + 51489 + ], + "temperature": 0.0, + "avg_logprob": -0.08241327932058287, + "compression_ratio": 1.5960784313725491, + "no_speech_prob": 0.09794807434082031, + "confidence": 0.957, + "words": [ + { + "text": "Et", + "start": 66.88, + "end": 67.02, + "confidence": 0.654 + }, + { + "text": "donc", + "start": 67.02, + "end": 67.12, + "confidence": 0.901 + }, + { + "text": "cette", + "start": 67.12, + "end": 67.3, + "confidence": 0.713 + }, + { + "text": "espèce", + "start": 67.3, + "end": 67.54, + "confidence": 0.996 + }, + { + "text": "de", + "start": 67.54, + "end": 67.76, + "confidence": 0.999 + }, + { + "text": "nouveauté", + "start": 67.76, + "end": 68.48, + "confidence": 0.98 + }, + { + "text": "dans", + "start": 68.48, + "end": 68.84, + "confidence": 0.982 + }, + { + "text": "la", + "start": 68.84, + "end": 68.96, + "confidence": 0.995 + }, + { + "text": "relation", + "start": 68.96, + "end": 69.24, + "confidence": 0.998 + }, + { + "text": "à", + "start": 69.24, + "end": 69.38, + "confidence": 0.997 + }, + { + "text": "l'objet,", + "start": 69.38, + "end": 70.0, + "confidence": 0.998 + }, + { + "text": "c'est", + "start": 70.28, + "end": 70.38, + "confidence": 0.977 + }, + { + "text": "fascinant", + "start": 70.38, + "end": 70.68, + "confidence": 0.98 + }, + { + "text": "et", + "start": 70.68, + "end": 70.76, + 
"confidence": 0.973 + }, + { + "text": "terrifiant.", + "start": 70.76, + "end": 71.24, + "confidence": 0.977 + } + ] + }, + { + "id": 15, + "seek": 7134, + "start": 71.62, + "end": 76.42, + "text": " Parce qu'on a l'impression, comme le disent les utilisateurs et les services, d'être dépendant de cet objet,", + "tokens": [ + 50389, + 20429, + 421, + 6, + 266, + 257, + 287, + 6, + 36107, + 11, + 5173, + 476, + 37313, + 1512, + 33643, + 25929, + 1030, + 1512, + 3328, + 11, + 274, + 6, + 9498, + 45768, + 394, + 368, + 8603, + 14964, + 11, + 50639 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.862, + "words": [ + { + "text": "Parce", + "start": 71.62, + "end": 71.9, + "confidence": 0.843 + }, + { + "text": "qu'on", + "start": 71.9, + "end": 72.4, + "confidence": 0.968 + }, + { + "text": "a", + "start": 72.4, + "end": 72.54, + "confidence": 0.979 + }, + { + "text": "l'impression,", + "start": 72.54, + "end": 72.9, + "confidence": 0.997 + }, + { + "text": "comme", + "start": 73.66, + "end": 73.9, + "confidence": 0.982 + }, + { + "text": "le", + "start": 73.9, + "end": 74.02, + "confidence": 0.984 + }, + { + "text": "disent", + "start": 74.02, + "end": 74.22, + "confidence": 0.997 + }, + { + "text": "les", + "start": 74.22, + "end": 74.52, + "confidence": 0.996 + }, + { + "text": "utilisateurs", + "start": 74.52, + "end": 74.84, + "confidence": 0.998 + }, + { + "text": "et", + "start": 74.84, + "end": 74.94, + "confidence": 0.845 + }, + { + "text": "les", + "start": 74.94, + "end": 75.02, + "confidence": 0.783 + }, + { + "text": "services,", + "start": 75.02, + "end": 75.18, + "confidence": 0.129 + }, + { + "text": "d'être", + "start": 75.22, + "end": 75.5, + "confidence": 0.935 + }, + { + "text": "dépendant", + "start": 75.5, + "end": 75.98, + "confidence": 0.709 + }, + { + "text": "de", + "start": 75.98, + "end": 76.08, + "confidence": 0.977 + }, + 
{ + "text": "cet", + "start": 76.08, + "end": 76.26, + "confidence": 0.998 + }, + { + "text": "objet,", + "start": 76.26, + "end": 76.42, + "confidence": 0.997 + } + ] + }, + { + "id": 16, + "seek": 7134, + "start": 76.42, + "end": 83.3, + "text": " d'induire en fait une espèce de relation, de médiation avec le monde qui rend de l'ampleur et qui amène aussi à des formes de rejet.", + "tokens": [ + 50639, + 274, + 6, + 471, + 43612, + 465, + 3887, + 2251, + 7089, + 30236, + 368, + 9721, + 11, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 368, + 287, + 6, + 335, + 781, + 374, + 1030, + 1956, + 669, + 18832, + 6212, + 1531, + 730, + 1254, + 279, + 368, + 319, + 7108, + 13, + 50989 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.923, + "words": [ + { + "text": "d'induire", + "start": 76.42, + "end": 77.1, + "confidence": 0.964 + }, + { + "text": "en", + "start": 77.1, + "end": 77.18, + "confidence": 0.72 + }, + { + "text": "fait", + "start": 77.18, + "end": 77.34, + "confidence": 0.997 + }, + { + "text": "une", + "start": 77.34, + "end": 77.5, + "confidence": 0.979 + }, + { + "text": "espèce", + "start": 77.5, + "end": 77.88, + "confidence": 0.997 + }, + { + "text": "de", + "start": 77.88, + "end": 78.28, + "confidence": 0.997 + }, + { + "text": "relation,", + "start": 78.28, + "end": 78.54, + "confidence": 0.422 + }, + { + "text": "de", + "start": 78.66, + "end": 78.96, + "confidence": 0.992 + }, + { + "text": "médiation", + "start": 78.96, + "end": 79.52, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 79.52, + "end": 79.76, + "confidence": 0.954 + }, + { + "text": "le", + "start": 79.76, + "end": 80.02, + "confidence": 0.998 + }, + { + "text": "monde", + "start": 80.02, + "end": 80.3, + "confidence": 0.996 + }, + { + "text": "qui", + "start": 80.3, + "end": 81.24, + "confidence": 0.661 + }, + { + "text": "rend", + 
"start": 81.24, + "end": 81.66, + "confidence": 0.968 + }, + { + "text": "de", + "start": 81.66, + "end": 81.74, + "confidence": 0.688 + }, + { + "text": "l'ampleur", + "start": 81.74, + "end": 82.02, + "confidence": 0.995 + }, + { + "text": "et", + "start": 82.02, + "end": 82.1, + "confidence": 0.952 + }, + { + "text": "qui", + "start": 82.1, + "end": 82.2, + "confidence": 0.987 + }, + { + "text": "amène", + "start": 82.2, + "end": 82.38, + "confidence": 0.971 + }, + { + "text": "aussi", + "start": 82.38, + "end": 82.54, + "confidence": 0.946 + }, + { + "text": "à", + "start": 82.54, + "end": 82.62, + "confidence": 0.959 + }, + { + "text": "des", + "start": 82.62, + "end": 82.7, + "confidence": 0.992 + }, + { + "text": "formes", + "start": 82.7, + "end": 82.88, + "confidence": 0.995 + }, + { + "text": "de", + "start": 82.88, + "end": 83.04, + "confidence": 0.998 + }, + { + "text": "rejet.", + "start": 83.04, + "end": 83.3, + "confidence": 0.802 + } + ] + }, + { + "id": 17, + "seek": 7134, + "start": 83.92, + "end": 87.7, + "text": " Donc à objet inédit, rapport inédit.", + "tokens": [ + 50989, + 7477, + 1531, + 14964, + 294, + 7811, + 270, + 11, + 18018, + 294, + 7811, + 270, + 13, + 51189 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.901, + "words": [ + { + "text": "Donc", + "start": 83.92, + "end": 84.46, + "confidence": 0.984 + }, + { + "text": "à", + "start": 84.46, + "end": 84.98, + "confidence": 0.483 + }, + { + "text": "objet", + "start": 84.98, + "end": 85.46, + "confidence": 0.77 + }, + { + "text": "inédit,", + "start": 85.46, + "end": 86.2, + "confidence": 0.994 + }, + { + "text": "rapport", + "start": 86.54, + "end": 86.9, + "confidence": 0.986 + }, + { + "text": "inédit.", + "start": 86.9, + "end": 87.7, + "confidence": 0.998 + } + ] + }, + { + "id": 18, + "seek": 7134, + "start": 88.02, + "end": 94.92, + "text": " Et ce rapport, 
si j'en crois à Nicolas, serait caractérisé par un mélange de dépendance et de rejet.", + "tokens": [ + 51189, + 3790, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 21724, + 1531, + 38268, + 11, + 23139, + 1032, + 578, + 4198, + 22118, + 971, + 517, + 41953, + 933, + 368, + 45768, + 719, + 1030, + 368, + 319, + 7108, + 13, + 51539 + ], + "temperature": 0.0, + "avg_logprob": -0.11220460018869173, + "compression_ratio": 1.5975609756097562, + "no_speech_prob": 0.015181643888354301, + "confidence": 0.975, + "words": [ + { + "text": "Et", + "start": 88.02, + "end": 88.62, + "confidence": 0.989 + }, + { + "text": "ce", + "start": 88.62, + "end": 88.9, + "confidence": 0.985 + }, + { + "text": "rapport,", + "start": 88.9, + "end": 89.32, + "confidence": 0.998 + }, + { + "text": "si", + "start": 89.38, + "end": 89.56, + "confidence": 0.999 + }, + { + "text": "j'en", + "start": 89.56, + "end": 89.78, + "confidence": 0.997 + }, + { + "text": "crois", + "start": 89.78, + "end": 89.88, + "confidence": 0.988 + }, + { + "text": "à", + "start": 89.88, + "end": 90.06, + "confidence": 0.724 + }, + { + "text": "Nicolas,", + "start": 90.06, + "end": 90.24, + "confidence": 0.997 + }, + { + "text": "serait", + "start": 90.7, + "end": 91.0, + "confidence": 0.904 + }, + { + "text": "caractérisé", + "start": 91.0, + "end": 91.8, + "confidence": 0.994 + }, + { + "text": "par", + "start": 91.8, + "end": 92.22, + "confidence": 0.995 + }, + { + "text": "un", + "start": 92.22, + "end": 92.52, + "confidence": 0.996 + }, + { + "text": "mélange", + "start": 92.52, + "end": 93.04, + "confidence": 0.999 + }, + { + "text": "de", + "start": 93.04, + "end": 93.46, + "confidence": 0.998 + }, + { + "text": "dépendance", + "start": 93.46, + "end": 94.12, + "confidence": 0.938 + }, + { + "text": "et", + "start": 94.12, + "end": 94.54, + "confidence": 0.998 + }, + { + "text": "de", + "start": 94.54, + "end": 94.72, + "confidence": 0.999 + }, + { + "text": "rejet.", + "start": 94.72, + "end": 94.92, + 
"confidence": 0.988 + } + ] + }, + { + "id": 19, + "seek": 9484, + "start": 95.74, + "end": 102.82, + "text": " Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objets techniques et de leur insertion dans nos vies", + "tokens": [ + 50389, + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 5732, + 962, + 1712, + 14953, + 287, + 6, + 29093, + 730, + 1111, + 25349, + 7512, + 1030, + 368, + 9580, + 8969, + 313, + 2680, + 3269, + 371, + 530, + 50739 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.932, + "words": [ + { + "text": "Bon,", + "start": 95.74, + "end": 96.0, + "confidence": 0.751 + }, + { + "text": "en", + "start": 96.34, + "end": 96.54, + "confidence": 0.992 + }, + { + "text": "vrai,", + "start": 96.54, + "end": 96.86, + "confidence": 0.991 + }, + { + "text": "il", + "start": 97.06, + "end": 97.18, + "confidence": 0.992 + }, + { + "text": "faudrait", + "start": 97.18, + "end": 97.58, + "confidence": 0.996 + }, + { + "text": "remonter", + "start": 97.58, + "end": 98.06, + "confidence": 0.995 + }, + { + "text": "très", + "start": 98.06, + "end": 98.58, + "confidence": 0.995 + }, + { + "text": "très", + "start": 98.58, + "end": 98.84, + "confidence": 0.757 + }, + { + "text": "finement", + "start": 98.84, + "end": 99.38, + "confidence": 0.823 + }, + { + "text": "toute", + "start": 99.38, + "end": 99.7, + "confidence": 0.937 + }, + { + "text": "l'histoire", + "start": 99.7, + "end": 100.08, + "confidence": 0.996 + }, + { + "text": "des", + "start": 100.08, + "end": 100.26, + "confidence": 0.991 + }, + { + "text": "objets", + "start": 100.26, + "end": 100.52, + "confidence": 0.998 + }, + { + "text": "techniques", + "start": 100.52, + "end": 100.94, + "confidence": 0.982 + }, + { + "text": "et", + "start": 100.94, + "end": 101.54, + "confidence": 0.512 + }, + { + "text": "de", + "start": 
101.54, + "end": 101.7, + "confidence": 0.984 + }, + { + "text": "leur", + "start": 101.7, + "end": 101.84, + "confidence": 0.818 + }, + { + "text": "insertion", + "start": 101.84, + "end": 102.34, + "confidence": 0.994 + }, + { + "text": "dans", + "start": 102.34, + "end": 102.5, + "confidence": 0.969 + }, + { + "text": "nos", + "start": 102.5, + "end": 102.66, + "confidence": 0.998 + }, + { + "text": "vies", + "start": 102.66, + "end": 102.82, + "confidence": 0.998 + } + ] + }, + { + "id": 20, + "seek": 9484, + "start": 102.86, + "end": 105.72, + "text": " pour déterminer si ce rapport est totalement inédit.", + "tokens": [ + 50739, + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203, + 294, + 7811, + 270, + 13, + 50889 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.995, + "words": [ + { + "text": "pour", + "start": 102.86, + "end": 103.1, + "confidence": 0.989 + }, + { + "text": "déterminer", + "start": 103.1, + "end": 103.64, + "confidence": 0.995 + }, + { + "text": "si", + "start": 103.64, + "end": 103.76, + "confidence": 0.986 + }, + { + "text": "ce", + "start": 103.76, + "end": 103.94, + "confidence": 0.991 + }, + { + "text": "rapport", + "start": 103.94, + "end": 104.26, + "confidence": 0.998 + }, + { + "text": "est", + "start": 104.26, + "end": 104.84, + "confidence": 0.997 + }, + { + "text": "totalement", + "start": 104.84, + "end": 105.3, + "confidence": 0.998 + }, + { + "text": "inédit.", + "start": 105.3, + "end": 105.72, + "confidence": 0.998 + } + ] + }, + { + "id": 21, + "seek": 9484, + "start": 106.14, + "end": 109.32, + "text": " Mais j'ai l'impression comme ça que Nicolas ne se trompe pas vraiment.", + "tokens": [ + 50889, + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 408, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13, + 51089 + ], + "temperature": 0.0, + 
"avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.932, + "words": [ + { + "text": "Mais", + "start": 106.14, + "end": 106.4, + "confidence": 0.975 + }, + { + "text": "j'ai", + "start": 106.4, + "end": 106.92, + "confidence": 0.956 + }, + { + "text": "l'impression", + "start": 106.92, + "end": 107.38, + "confidence": 0.999 + }, + { + "text": "comme", + "start": 107.38, + "end": 107.58, + "confidence": 0.513 + }, + { + "text": "ça", + "start": 107.58, + "end": 107.82, + "confidence": 0.969 + }, + { + "text": "que", + "start": 107.82, + "end": 108.14, + "confidence": 0.973 + }, + { + "text": "Nicolas", + "start": 108.14, + "end": 108.48, + "confidence": 0.983 + }, + { + "text": "ne", + "start": 108.48, + "end": 108.6, + "confidence": 0.72 + }, + { + "text": "se", + "start": 108.6, + "end": 108.72, + "confidence": 0.992 + }, + { + "text": "trompe", + "start": 108.72, + "end": 108.88, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 108.88, + "end": 109.08, + "confidence": 0.999 + }, + { + "text": "vraiment.", + "start": 109.08, + "end": 109.32, + "confidence": 0.989 + } + ] + }, + { + "id": 22, + "seek": 9484, + "start": 109.94, + "end": 115.06, + "text": " Pour autant que je sache, il y a eu plein de discussions autour de la voiture ou même du téléphone.", + "tokens": [ + 51089, + 8732, + 34081, + 631, + 1506, + 262, + 6000, + 11, + 1930, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698, + 1581, + 47159, + 13, + 51389 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.964, + "words": [ + { + "text": "Pour", + "start": 109.94, + "end": 110.1, + "confidence": 0.995 + }, + { + "text": "autant", + "start": 110.1, + "end": 110.24, + "confidence": 1.0 + }, + { + "text": "que", + "start": 110.24, + "end": 110.38, + 
"confidence": 0.984 + }, + { + "text": "je", + "start": 110.38, + "end": 110.52, + "confidence": 0.998 + }, + { + "text": "sache,", + "start": 110.52, + "end": 110.84, + "confidence": 0.952 + }, + { + "text": "il", + "start": 111.08, + "end": 111.16, + "confidence": 0.994 + }, + { + "text": "y", + "start": 111.16, + "end": 111.3, + "confidence": 0.995 + }, + { + "text": "a", + "start": 111.3, + "end": 111.32, + "confidence": 0.993 + }, + { + "text": "eu", + "start": 111.32, + "end": 111.62, + "confidence": 0.998 + }, + { + "text": "plein", + "start": 111.62, + "end": 111.9, + "confidence": 0.966 + }, + { + "text": "de", + "start": 111.9, + "end": 112.14, + "confidence": 0.997 + }, + { + "text": "discussions", + "start": 112.14, + "end": 112.66, + "confidence": 0.83 + }, + { + "text": "autour", + "start": 112.66, + "end": 113.02, + "confidence": 0.995 + }, + { + "text": "de", + "start": 113.02, + "end": 113.38, + "confidence": 0.996 + }, + { + "text": "la", + "start": 113.38, + "end": 113.52, + "confidence": 0.998 + }, + { + "text": "voiture", + "start": 113.52, + "end": 113.88, + "confidence": 1.0 + }, + { + "text": "ou", + "start": 113.88, + "end": 114.06, + "confidence": 0.69 + }, + { + "text": "même", + "start": 114.06, + "end": 114.34, + "confidence": 0.995 + }, + { + "text": "du", + "start": 114.34, + "end": 114.64, + "confidence": 0.992 + }, + { + "text": "téléphone.", + "start": 114.64, + "end": 115.06, + "confidence": 0.999 + } + ] + }, + { + "id": 23, + "seek": 9484, + "start": 115.48, + "end": 117.7, + "text": " Mais la dépendance n'était pas du même ordre.", + "tokens": [ + 51389, + 6313, + 635, + 45768, + 719, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13, + 51489 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.992, + "words": [ + { + "text": "Mais", + "start": 115.48, + "end": 115.78, + "confidence": 0.993 + }, + { + 
"text": "la", + "start": 115.78, + "end": 116.04, + "confidence": 0.943 + }, + { + "text": "dépendance", + "start": 116.04, + "end": 116.42, + "confidence": 0.996 + }, + { + "text": "n'était", + "start": 116.42, + "end": 116.7, + "confidence": 0.994 + }, + { + "text": "pas", + "start": 116.7, + "end": 117.0, + "confidence": 0.998 + }, + { + "text": "du", + "start": 117.0, + "end": 117.2, + "confidence": 0.996 + }, + { + "text": "même", + "start": 117.2, + "end": 117.44, + "confidence": 0.998 + }, + { + "text": "ordre.", + "start": 117.44, + "end": 117.7, + "confidence": 0.999 + } + ] + }, + { + "id": 24, + "seek": 9484, + "start": 117.72, + "end": 119.78, + "text": " Donc le rejet non plus n'était pas du même ordre.", + "tokens": [ + 51489, + 7477, + 476, + 319, + 7108, + 2107, + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 4792, + 265, + 13, + 51589 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.979, + "words": [ + { + "text": "Donc", + "start": 117.72, + "end": 118.02, + "confidence": 0.959 + }, + { + "text": "le", + "start": 118.02, + "end": 118.4, + "confidence": 0.819 + }, + { + "text": "rejet", + "start": 118.4, + "end": 118.64, + "confidence": 0.999 + }, + { + "text": "non", + "start": 118.64, + "end": 118.82, + "confidence": 0.982 + }, + { + "text": "plus", + "start": 118.82, + "end": 118.94, + "confidence": 0.994 + }, + { + "text": "n'était", + "start": 118.94, + "end": 119.18, + "confidence": 0.991 + }, + { + "text": "pas", + "start": 119.18, + "end": 119.3, + "confidence": 0.998 + }, + { + "text": "du", + "start": 119.3, + "end": 119.42, + "confidence": 0.995 + }, + { + "text": "même", + "start": 119.42, + "end": 119.58, + "confidence": 0.999 + }, + { + "text": "ordre.", + "start": 119.58, + "end": 119.78, + "confidence": 0.999 + } + ] + }, + { + "id": 25, + "seek": 9484, + "start": 120.04, + "end": 123.1, + "text": " On peut 
adorer sa bagnole, en avoir besoin pour plein de choses.", + "tokens": [ + 51589, + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 1771, + 306, + 11, + 465, + 10853, + 19207, + 2016, + 21088, + 368, + 14488, + 13, + 51789 + ], + "temperature": 0.0, + "avg_logprob": -0.0781538827078683, + "compression_ratio": 1.6719745222929936, + "no_speech_prob": 0.017434891313314438, + "confidence": 0.971, + "words": [ + { + "text": "On", + "start": 120.04, + "end": 120.16, + "confidence": 0.757 + }, + { + "text": "peut", + "start": 120.16, + "end": 120.36, + "confidence": 0.997 + }, + { + "text": "adorer", + "start": 120.36, + "end": 120.68, + "confidence": 0.991 + }, + { + "text": "sa", + "start": 120.68, + "end": 120.88, + "confidence": 0.98 + }, + { + "text": "bagnole,", + "start": 120.88, + "end": 121.34, + "confidence": 0.985 + }, + { + "text": "en", + "start": 121.42, + "end": 121.56, + "confidence": 0.971 + }, + { + "text": "avoir", + "start": 121.56, + "end": 121.8, + "confidence": 0.997 + }, + { + "text": "besoin", + "start": 121.8, + "end": 122.12, + "confidence": 0.999 + }, + { + "text": "pour", + "start": 122.12, + "end": 122.46, + "confidence": 0.989 + }, + { + "text": "plein", + "start": 122.46, + "end": 122.7, + "confidence": 0.987 + }, + { + "text": "de", + "start": 122.7, + "end": 122.78, + "confidence": 0.997 + }, + { + "text": "choses.", + "start": 122.78, + "end": 123.1, + "confidence": 0.99 + } + ] + }, + { + "id": 26, + "seek": 12334, + "start": 123.38, + "end": 126.44, + "text": " Le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 50389, + 1456, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13, + 50539 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.94, + "words": [ + { + "text": "Le", + "start": 123.38, + "end": 123.96, + "confidence": 0.645 + }, + { + "text": "soir,", + 
"start": 123.96, + "end": 124.54, + "confidence": 0.998 + }, + { + "text": "quand", + "start": 124.74, + "end": 124.94, + "confidence": 0.982 + }, + { + "text": "on", + "start": 124.94, + "end": 125.06, + "confidence": 0.996 + }, + { + "text": "va", + "start": 125.06, + "end": 125.16, + "confidence": 0.99 + }, + { + "text": "se", + "start": 125.16, + "end": 125.26, + "confidence": 0.989 + }, + { + "text": "coucher,", + "start": 125.26, + "end": 125.7, + "confidence": 0.989 + }, + { + "text": "on", + "start": 125.94, + "end": 126.04, + "confidence": 0.992 + }, + { + "text": "la", + "start": 126.04, + "end": 126.18, + "confidence": 0.852 + }, + { + "text": "laisse.", + "start": 126.18, + "end": 126.44, + "confidence": 0.999 + } + ] + }, + { + "id": 27, + "seek": 12334, + "start": 127.0, + "end": 130.3, + "text": " On ne l'a pas dans la main quand on est au lit, on ne l'emmène pas au chiottes.", + "tokens": [ + 50539, + 1282, + 408, + 287, + 6, + 64, + 1736, + 2680, + 635, + 2135, + 6932, + 322, + 871, + 1609, + 7997, + 11, + 322, + 408, + 287, + 6, + 443, + 76, + 18832, + 1736, + 1609, + 13228, + 1521, + 279, + 13, + 50739 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.918, + "words": [ + { + "text": "On", + "start": 127.0, + "end": 127.34, + "confidence": 0.967 + }, + { + "text": "ne", + "start": 127.34, + "end": 127.46, + "confidence": 0.801 + }, + { + "text": "l'a", + "start": 127.46, + "end": 127.56, + "confidence": 0.929 + }, + { + "text": "pas", + "start": 127.56, + "end": 127.68, + "confidence": 0.999 + }, + { + "text": "dans", + "start": 127.68, + "end": 127.86, + "confidence": 0.992 + }, + { + "text": "la", + "start": 127.86, + "end": 128.08, + "confidence": 0.996 + }, + { + "text": "main", + "start": 128.08, + "end": 128.26, + "confidence": 0.999 + }, + { + "text": "quand", + "start": 128.26, + "end": 128.48, + "confidence": 0.936 + }, + 
{ + "text": "on", + "start": 128.48, + "end": 128.6, + "confidence": 0.993 + }, + { + "text": "est", + "start": 128.6, + "end": 128.74, + "confidence": 0.992 + }, + { + "text": "au", + "start": 128.74, + "end": 128.94, + "confidence": 0.976 + }, + { + "text": "lit,", + "start": 128.94, + "end": 129.1, + "confidence": 0.999 + }, + { + "text": "on", + "start": 129.16, + "end": 129.28, + "confidence": 0.43 + }, + { + "text": "ne", + "start": 129.28, + "end": 129.3, + "confidence": 0.949 + }, + { + "text": "l'emmène", + "start": 129.3, + "end": 129.58, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 129.58, + "end": 129.7, + "confidence": 0.997 + }, + { + "text": "au", + "start": 129.7, + "end": 129.88, + "confidence": 0.72 + }, + { + "text": "chiottes.", + "start": 129.88, + "end": 130.3, + "confidence": 0.886 + } + ] + }, + { + "id": 28, + "seek": 12334, + "start": 130.84, + "end": 136.88, + "text": " On pouvait être énervé par son môme qui occupait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain.", + "tokens": [ + 50739, + 1282, + 45913, + 7418, + 45045, + 15797, + 971, + 1872, + 275, + 2851, + 1398, + 1956, + 8073, + 1001, + 635, + 34207, + 368, + 47159, + 17338, + 2251, + 30027, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13, + 51039 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.925, + "words": [ + { + "text": "On", + "start": 130.84, + "end": 131.06, + "confidence": 0.996 + }, + { + "text": "pouvait", + "start": 131.06, + "end": 131.26, + "confidence": 0.989 + }, + { + "text": "être", + "start": 131.26, + "end": 131.58, + "confidence": 0.995 + }, + { + "text": "énervé", + "start": 131.58, + "end": 132.22, + "confidence": 0.896 + }, + { + "text": "par", + "start": 132.22, + "end": 132.46, + "confidence": 0.992 + }, + { + "text": "son", + "start": 132.46, + "end": 132.72, 
+ "confidence": 0.998 + }, + { + "text": "môme", + "start": 132.72, + "end": 133.08, + "confidence": 0.758 + }, + { + "text": "qui", + "start": 133.08, + "end": 133.34, + "confidence": 0.916 + }, + { + "text": "occupait", + "start": 133.34, + "end": 133.74, + "confidence": 0.992 + }, + { + "text": "la", + "start": 133.74, + "end": 133.86, + "confidence": 0.986 + }, + { + "text": "ligne", + "start": 133.86, + "end": 134.06, + "confidence": 0.999 + }, + { + "text": "de", + "start": 134.06, + "end": 134.22, + "confidence": 0.995 + }, + { + "text": "téléphone", + "start": 134.22, + "end": 134.6, + "confidence": 0.992 + }, + { + "text": "pendant", + "start": 134.6, + "end": 134.92, + "confidence": 0.709 + }, + { + "text": "une", + "start": 134.92, + "end": 135.16, + "confidence": 0.78 + }, + { + "text": "heure", + "start": 135.16, + "end": 135.34, + "confidence": 0.995 + }, + { + "text": "chaque", + "start": 135.34, + "end": 135.58, + "confidence": 0.982 + }, + { + "text": "soir", + "start": 135.58, + "end": 135.8, + "confidence": 0.995 + }, + { + "text": "pour", + "start": 135.8, + "end": 135.98, + "confidence": 0.66 + }, + { + "text": "discuter", + "start": 135.98, + "end": 136.3, + "confidence": 0.997 + }, + { + "text": "avec", + "start": 136.3, + "end": 136.5, + "confidence": 0.995 + }, + { + "text": "un", + "start": 136.5, + "end": 136.66, + "confidence": 0.997 + }, + { + "text": "copain.", + "start": 136.66, + "end": 136.88, + "confidence": 0.996 + } + ] + }, + { + "id": 29, + "seek": 12334, + "start": 137.26, + "end": 141.86, + "text": " Mais ça ne ressemblait pas à ce qu'on peut ressentir à voir ce même môme aujourd'hui,", + "tokens": [ + 51039, + 6313, + 2788, + 408, + 725, + 15750, + 35235, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 1769, + 5698, + 275, + 2851, + 1398, + 14023, + 6, + 10556, + 11, + 51289 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 
1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.956, + "words": [ + { + "text": "Mais", + "start": 137.26, + "end": 137.5, + "confidence": 0.989 + }, + { + "text": "ça", + "start": 137.5, + "end": 137.68, + "confidence": 0.928 + }, + { + "text": "ne", + "start": 137.68, + "end": 137.88, + "confidence": 0.999 + }, + { + "text": "ressemblait", + "start": 137.88, + "end": 138.42, + "confidence": 0.993 + }, + { + "text": "pas", + "start": 138.42, + "end": 138.78, + "confidence": 0.994 + }, + { + "text": "à", + "start": 138.78, + "end": 138.9, + "confidence": 0.989 + }, + { + "text": "ce", + "start": 138.9, + "end": 138.98, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 138.98, + "end": 139.12, + "confidence": 0.976 + }, + { + "text": "peut", + "start": 139.12, + "end": 139.48, + "confidence": 0.979 + }, + { + "text": "ressentir", + "start": 139.48, + "end": 140.1, + "confidence": 0.996 + }, + { + "text": "à", + "start": 140.1, + "end": 140.32, + "confidence": 0.575 + }, + { + "text": "voir", + "start": 140.32, + "end": 140.46, + "confidence": 0.728 + }, + { + "text": "ce", + "start": 140.46, + "end": 140.7, + "confidence": 0.985 + }, + { + "text": "même", + "start": 140.7, + "end": 140.94, + "confidence": 0.982 + }, + { + "text": "môme", + "start": 140.94, + "end": 141.28, + "confidence": 0.997 + }, + { + "text": "aujourd'hui,", + "start": 141.28, + "end": 141.86, + "confidence": 0.994 + } + ] + }, + { + "id": 30, + "seek": 12334, + "start": 142.16, + "end": 144.22, + "text": " continuellement avec son smartphone dans la main,", + "tokens": [ + 51289, + 2354, + 285, + 1712, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.961, + "words": [ + { + "text": "continuellement", + "start": 142.16, + "end": 142.94, + "confidence": 0.963 + }, + { + "text": 
"avec", + "start": 142.94, + "end": 143.2, + "confidence": 0.844 + }, + { + "text": "son", + "start": 143.2, + "end": 143.42, + "confidence": 0.994 + }, + { + "text": "smartphone", + "start": 143.42, + "end": 143.76, + "confidence": 0.972 + }, + { + "text": "dans", + "start": 143.76, + "end": 143.92, + "confidence": 0.963 + }, + { + "text": "la", + "start": 143.92, + "end": 144.02, + "confidence": 0.997 + }, + { + "text": "main,", + "start": 144.02, + "end": 144.22, + "confidence": 0.997 + } + ] + }, + { + "id": 31, + "seek": 12334, + "start": 144.34, + "end": 148.8, + "text": " comme si c'était une sorte de pacemaker externe, comme si le lâcher allait entraîner sa mort immédiate.", + "tokens": [ + 51414, + 5173, + 1511, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 15165, + 49523, + 454, + 391, + 716, + 11, + 5173, + 1511, + 476, + 48835, + 6759, + 439, + 1001, + 22284, + 7517, + 1193, + 601, + 6599, + 3397, + 526, + 4504, + 473, + 13, + 51639 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.973, + "words": [ + { + "text": "comme", + "start": 144.34, + "end": 144.56, + "confidence": 0.985 + }, + { + "text": "si", + "start": 144.56, + "end": 144.66, + "confidence": 0.971 + }, + { + "text": "c'était", + "start": 144.66, + "end": 144.86, + "confidence": 0.987 + }, + { + "text": "une", + "start": 144.86, + "end": 144.98, + "confidence": 0.983 + }, + { + "text": "sorte", + "start": 144.98, + "end": 145.14, + "confidence": 0.992 + }, + { + "text": "de", + "start": 145.14, + "end": 145.34, + "confidence": 0.989 + }, + { + "text": "pacemaker", + "start": 145.34, + "end": 145.82, + "confidence": 0.931 + }, + { + "text": "externe,", + "start": 145.82, + "end": 146.4, + "confidence": 0.99 + }, + { + "text": "comme", + "start": 146.44, + "end": 146.6, + "confidence": 0.721 + }, + { + "text": "si", + "start": 146.6, + "end": 146.74, + "confidence": 0.993 + }, 
+ { + "text": "le", + "start": 146.74, + "end": 147.0, + "confidence": 0.996 + }, + { + "text": "lâcher", + "start": 147.0, + "end": 147.36, + "confidence": 0.968 + }, + { + "text": "allait", + "start": 147.36, + "end": 147.58, + "confidence": 0.991 + }, + { + "text": "entraîner", + "start": 147.58, + "end": 147.88, + "confidence": 0.982 + }, + { + "text": "sa", + "start": 147.88, + "end": 148.02, + "confidence": 0.999 + }, + { + "text": "mort", + "start": 148.02, + "end": 148.3, + "confidence": 0.998 + }, + { + "text": "immédiate.", + "start": 148.3, + "end": 148.8, + "confidence": 0.998 + } + ] + }, + { + "id": 32, + "seek": 12334, + "start": 148.94, + "end": 152.02, + "text": " Bon, je dis ça pour le môme, mais c'est évidemment valable pour nous aussi.", + "tokens": [ + 51639, + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 2851, + 1398, + 11, + 2420, + 269, + 6, + 377, + 24724, + 1323, + 712, + 2016, + 4666, + 6212, + 13, + 51839 + ], + "temperature": 0.0, + "avg_logprob": -0.08272041363662548, + "compression_ratio": 1.6818181818181819, + "no_speech_prob": 0.01115426979959011, + "confidence": 0.973, + "words": [ + { + "text": "Bon,", + "start": 148.94, + "end": 149.24, + "confidence": 0.804 + }, + { + "text": "je", + "start": 149.26, + "end": 149.34, + "confidence": 0.933 + }, + { + "text": "dis", + "start": 149.34, + "end": 149.46, + "confidence": 0.982 + }, + { + "text": "ça", + "start": 149.46, + "end": 149.64, + "confidence": 0.992 + }, + { + "text": "pour", + "start": 149.64, + "end": 149.78, + "confidence": 0.997 + }, + { + "text": "le", + "start": 149.78, + "end": 149.9, + "confidence": 0.994 + }, + { + "text": "môme,", + "start": 149.9, + "end": 150.1, + "confidence": 0.999 + }, + { + "text": "mais", + "start": 150.32, + "end": 150.5, + "confidence": 0.904 + }, + { + "text": "c'est", + "start": 150.5, + "end": 150.84, + "confidence": 0.979 + }, + { + "text": "évidemment", + "start": 150.84, + "end": 151.18, + "confidence": 0.979 + }, + { + 
"text": "valable", + "start": 151.18, + "end": 151.48, + "confidence": 0.997 + }, + { + "text": "pour", + "start": 151.48, + "end": 151.64, + "confidence": 0.996 + }, + { + "text": "nous", + "start": 151.64, + "end": 151.78, + "confidence": 0.998 + }, + { + "text": "aussi.", + "start": 151.78, + "end": 152.02, + "confidence": 0.997 + } + ] + }, + { + "id": 33, + "seek": 15284, + "start": 153.14, + "end": 154.68, + "text": " Donc, rapport inédit, d'accord.", + "tokens": [ + 50389, + 7477, + 11, + 18018, + 294, + 7811, + 270, + 11, + 274, + 6, + 19947, + 13, + 50489 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.813, + "words": [ + { + "text": "Donc,", + "start": 153.14, + "end": 153.24, + "confidence": 0.232 + }, + { + "text": "rapport", + "start": 153.26, + "end": 153.62, + "confidence": 0.855 + }, + { + "text": "inédit,", + "start": 153.62, + "end": 154.18, + "confidence": 0.992 + }, + { + "text": "d'accord.", + "start": 154.28, + "end": 154.68, + "confidence": 0.997 + } + ] + }, + { + "id": 34, + "seek": 15284, + "start": 155.64, + "end": 158.52, + "text": " Mais pourquoi a-t-on l'impression qu'on n'en sortira jamais ?", + "tokens": [ + 50489, + 6313, + 19934, + 257, + 12, + 83, + 12, + 266, + 287, + 6, + 36107, + 421, + 6, + 266, + 297, + 6, + 268, + 1333, + 4271, + 14540, + 2506, + 50639 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.958, + "words": [ + { + "text": "Mais", + "start": 155.64, + "end": 155.88, + "confidence": 0.991 + }, + { + "text": "pourquoi", + "start": 155.88, + "end": 156.36, + "confidence": 0.992 + }, + { + "text": "a-t-on", + "start": 156.36, + "end": 156.7, + "confidence": 0.95 + }, + { + "text": "l'impression", + "start": 156.7, + "end": 157.06, + "confidence": 0.998 + }, + { + "text": "qu'on", + 
"start": 157.06, + "end": 157.28, + "confidence": 0.99 + }, + { + "text": "n'en", + "start": 157.28, + "end": 157.5, + "confidence": 0.859 + }, + { + "text": "sortira", + "start": 157.5, + "end": 157.86, + "confidence": 0.974 + }, + { + "text": "jamais ?", + "start": 157.86, + "end": 158.52, + "confidence": 0.997 + } + ] + }, + { + "id": 35, + "seek": 15284, + "start": 159.12, + "end": 165.36, + "text": " Est-ce qu'il faut en remettre la faute sur les gens qui ont créé cet outil merveilleux et diabolique, et diabolique parce que merveilleux ?", + "tokens": [ + 50639, + 4410, + 12, + 384, + 421, + 6, + 388, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 8603, + 484, + 388, + 3551, + 303, + 3409, + 2449, + 1030, + 1026, + 14923, + 1925, + 11, + 1030, + 1026, + 14923, + 1925, + 6992, + 631, + 3551, + 303, + 3409, + 2449, + 2506, + 50989 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.959, + "words": [ + { + "text": "Est-ce", + "start": 159.12, + "end": 159.34, + "confidence": 0.987 + }, + { + "text": "qu'il", + "start": 159.34, + "end": 159.46, + "confidence": 0.993 + }, + { + "text": "faut", + "start": 159.46, + "end": 159.64, + "confidence": 0.998 + }, + { + "text": "en", + "start": 159.64, + "end": 159.88, + "confidence": 0.961 + }, + { + "text": "remettre", + "start": 159.88, + "end": 160.14, + "confidence": 0.999 + }, + { + "text": "la", + "start": 160.14, + "end": 160.46, + "confidence": 0.995 + }, + { + "text": "faute", + "start": 160.46, + "end": 160.64, + "confidence": 0.986 + }, + { + "text": "sur", + "start": 160.64, + "end": 161.06, + "confidence": 0.982 + }, + { + "text": "les", + "start": 161.06, + "end": 161.3, + "confidence": 0.991 + }, + { + "text": "gens", + "start": 161.3, + "end": 161.46, + "confidence": 0.998 + }, + { + "text": "qui", + "start": 161.46, + "end": 
161.56, + "confidence": 0.724 + }, + { + "text": "ont", + "start": 161.56, + "end": 161.82, + "confidence": 0.996 + }, + { + "text": "créé", + "start": 161.82, + "end": 162.28, + "confidence": 0.985 + }, + { + "text": "cet", + "start": 162.28, + "end": 162.48, + "confidence": 0.816 + }, + { + "text": "outil", + "start": 162.48, + "end": 162.78, + "confidence": 0.993 + }, + { + "text": "merveilleux", + "start": 162.78, + "end": 163.36, + "confidence": 0.981 + }, + { + "text": "et", + "start": 163.36, + "end": 163.5, + "confidence": 0.983 + }, + { + "text": "diabolique,", + "start": 163.5, + "end": 163.84, + "confidence": 0.991 + }, + { + "text": "et", + "start": 163.86, + "end": 164.0, + "confidence": 0.555 + }, + { + "text": "diabolique", + "start": 164.0, + "end": 164.4, + "confidence": 0.949 + }, + { + "text": "parce", + "start": 164.4, + "end": 164.66, + "confidence": 0.927 + }, + { + "text": "que", + "start": 164.66, + "end": 164.86, + "confidence": 0.979 + }, + { + "text": "merveilleux ?", + "start": 164.86, + "end": 165.36, + "confidence": 0.997 + } + ] + }, + { + "id": 36, + "seek": 15284, + "start": 166.84, + "end": 168.82, + "text": " Les économistes parlent de dépendance du sentier.", + "tokens": [ + 51039, + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 2279, + 811, + 13, + 51139 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.986, + "words": [ + { + "text": "Les", + "start": 166.84, + "end": 167.08, + "confidence": 0.945 + }, + { + "text": "économistes", + "start": 167.08, + "end": 167.46, + "confidence": 0.997 + }, + { + "text": "parlent", + "start": 167.46, + "end": 167.72, + "confidence": 0.993 + }, + { + "text": "de", + "start": 167.72, + "end": 167.88, + "confidence": 0.992 + }, + { + "text": "dépendance", + "start": 167.88, + "end": 168.34, + "confidence": 0.986 + }, + { + "text": "du", + "start": 
168.34, + "end": 168.52, + "confidence": 0.996 + }, + { + "text": "sentier.", + "start": 168.52, + "end": 168.82, + "confidence": 0.983 + } + ] + }, + { + "id": 37, + "seek": 15284, + "start": 168.98, + "end": 177.38, + "text": " C'est l'idée qu'on met sur un sentier qui a été établi, soit volontairement en marchant dessus, soit en définissant des bornes, en définissant une signalétique.", + "tokens": [ + 51139, + 383, + 6, + 377, + 287, + 6, + 34281, + 421, + 6, + 266, + 1131, + 1022, + 517, + 2279, + 811, + 1956, + 257, + 8862, + 4823, + 455, + 2081, + 11, + 12703, + 40005, + 9020, + 518, + 465, + 8368, + 394, + 30677, + 11, + 12703, + 465, + 40763, + 29492, + 730, + 4232, + 279, + 11, + 465, + 40763, + 29492, + 2251, + 6358, + 42379, + 13, + 51589 + ], + "temperature": 0.0, + "avg_logprob": -0.12394786888444928, + "compression_ratio": 1.6703296703296704, + "no_speech_prob": 0.07031125575304031, + "confidence": 0.907, + "words": [ + { + "text": "C'est", + "start": 168.98, + "end": 169.2, + "confidence": 0.996 + }, + { + "text": "l'idée", + "start": 169.2, + "end": 169.38, + "confidence": 0.998 + }, + { + "text": "qu'on", + "start": 169.38, + "end": 169.74, + "confidence": 0.7 + }, + { + "text": "met", + "start": 169.74, + "end": 169.88, + "confidence": 0.648 + }, + { + "text": "sur", + "start": 169.88, + "end": 170.1, + "confidence": 0.995 + }, + { + "text": "un", + "start": 170.1, + "end": 170.52, + "confidence": 0.997 + }, + { + "text": "sentier", + "start": 170.52, + "end": 170.84, + "confidence": 0.991 + }, + { + "text": "qui", + "start": 170.84, + "end": 170.9, + "confidence": 0.955 + }, + { + "text": "a", + "start": 170.9, + "end": 171.0, + "confidence": 0.969 + }, + { + "text": "été", + "start": 171.0, + "end": 171.14, + "confidence": 0.994 + }, + { + "text": "établi,", + "start": 171.14, + "end": 171.5, + "confidence": 0.995 + }, + { + "text": "soit", + "start": 171.76, + "end": 172.1, + "confidence": 0.527 + }, + { + "text": "volontairement", + "start": 
172.1, + "end": 172.7, + "confidence": 0.987 + }, + { + "text": "en", + "start": 172.7, + "end": 172.86, + "confidence": 0.927 + }, + { + "text": "marchant", + "start": 172.86, + "end": 173.1, + "confidence": 0.997 + }, + { + "text": "dessus,", + "start": 173.1, + "end": 173.48, + "confidence": 0.995 + }, + { + "text": "soit", + "start": 173.86, + "end": 174.28, + "confidence": 0.749 + }, + { + "text": "en", + "start": 174.28, + "end": 175.16, + "confidence": 0.967 + }, + { + "text": "définissant", + "start": 175.16, + "end": 175.54, + "confidence": 0.981 + }, + { + "text": "des", + "start": 175.54, + "end": 175.74, + "confidence": 0.99 + }, + { + "text": "bornes,", + "start": 175.74, + "end": 175.98, + "confidence": 0.977 + }, + { + "text": "en", + "start": 176.04, + "end": 176.14, + "confidence": 0.673 + }, + { + "text": "définissant", + "start": 176.14, + "end": 176.66, + "confidence": 0.996 + }, + { + "text": "une", + "start": 176.66, + "end": 176.94, + "confidence": 0.983 + }, + { + "text": "signalétique.", + "start": 176.94, + "end": 177.38, + "confidence": 0.686 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/naive.cpu/accurate_apollo11.mp3.words.json b/tests/expected/naive.cpu/accurate_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..960a425ed608e1568f8c2f523148e8ea33ebb33c --- /dev/null +++ b/tests/expected/naive.cpu/accurate_apollo11.mp3.words.json @@ -0,0 +1,2375 @@ +{ + "text": " Apollo 11, Houston, we got a recommendation for you on your Soyuz-EA GLEM-E-G-E-A. All right. Okay. Yeah, sir. Yeah, sir. Let's take that camera. Let's say it makes it want to go on the helmet we were going to have in B-1. The other one. And you can put the other one on the mic helmet. We'll show it to you in a quick screen. Over. All right. Yeah, sir. All right. Yeah, sir. There's a better helmet than B-1. That's the other one. Nice. Let's go in there. At least we're safe. 
We've got them in there. Helmet bags. And, uh, I guess we have helmets in the helmet bag. At least it's in the helmet bag. Right here. Right here. Yeah, we're taking it next day out of the field up. Hey, we were... You want to hack me on this? Hey, we were... You want to hack me on this? With a cover, I tried it already. Okay, fine. We weren't sure of that. Just a suggestion. We thought we'd... You could check it out. It's not much of an order to turn that. So, uh, I guess we're going to come up with this. Let us know. Okay. No problem. Okay. No problem. We'll let you know when the end of... None. Okay.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.64, + "end": 6.78, + "text": " Apollo 11, Houston, we got a recommendation for you on your Soyuz-EA GLEM-E-G-E-A.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 11, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 36, + 32, + 460, + 2634, + 44, + 12, + 36, + 12, + 38, + 12, + 36, + 12, + 32, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.578, + "words": [ + { + "text": "Apollo", + "start": 0.64, + "end": 0.98, + "confidence": 0.426 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.54, + "confidence": 0.842 + }, + { + "text": "Houston,", + "start": 1.54, + "end": 1.96, + "confidence": 0.666 + }, + { + "text": "we", + "start": 1.96, + "end": 2.0, + "confidence": 0.983 + }, + { + "text": "got", + "start": 2.0, + "end": 2.16, + "confidence": 0.742 + }, + { + "text": "a", + "start": 2.16, + "end": 2.38, + "confidence": 0.993 + }, + { + "text": "recommendation", + "start": 2.38, + "end": 3.1, + "confidence": 0.977 + }, + { + "text": "for", + "start": 3.1, + "end": 3.54, + "confidence": 0.94 + }, + { + "text": "you", + "start": 3.54, + "end": 3.88, + "confidence": 0.993 + }, + { + "text": "on", + "start": 3.88, + "end": 4.26, + "confidence": 0.918 + }, 
+ { + "text": "your", + "start": 4.26, + "end": 4.3, + "confidence": 0.976 + }, + { + "text": "Soyuz-EA", + "start": 4.3, + "end": 5.38, + "confidence": 0.453 + }, + { + "text": "GLEM-E-G-E-A.", + "start": 5.38, + "end": 6.78, + "confidence": 0.436 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 7.78, + "end": 10.46, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.158, + "words": [ + { + "text": "All", + "start": 7.78, + "end": 7.82, + "confidence": 0.007 + }, + { + "text": "right.", + "start": 7.82, + "end": 10.46, + "confidence": 0.727 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 10.82, + "end": 11.38, + "text": " Okay.", + "tokens": [ + 1033, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.105, + "words": [ + { + "text": "Okay.", + "start": 10.82, + "end": 11.38, + "confidence": 0.105 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 12.02, + "end": 13.44, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.101, + "words": [ + { + "text": "Yeah,", + "start": 12.02, + "end": 12.76, + "confidence": 0.076 + }, + { + "text": "sir.", + "start": 12.76, + "end": 13.44, + "confidence": 0.135 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.58, + "end": 14.02, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.052, + "words": [ + { + "text": "Yeah,", + "start": 13.58, + "end": 13.84, + "confidence": 
0.108 + }, + { + "text": "sir.", + "start": 13.84, + "end": 14.02, + "confidence": 0.025 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 14.04, + "end": 14.6, + "text": " Let's take that camera.", + "tokens": [ + 961, + 311, + 747, + 300, + 2799, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.082, + "words": [ + { + "text": "Let's", + "start": 14.04, + "end": 14.26, + "confidence": 0.043 + }, + { + "text": "take", + "start": 14.26, + "end": 14.3, + "confidence": 0.04 + }, + { + "text": "that", + "start": 14.3, + "end": 14.36, + "confidence": 0.055 + }, + { + "text": "camera.", + "start": 14.36, + "end": 14.6, + "confidence": 0.269 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 14.62, + "end": 19.16, + "text": " Let's say it makes it want to go on the helmet we were going to have in B-1.", + "tokens": [ + 961, + 311, + 584, + 309, + 1669, + 309, + 528, + 281, + 352, + 322, + 264, + 15922, + 321, + 645, + 516, + 281, + 362, + 294, + 363, + 12, + 16, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.311, + "words": [ + { + "text": "Let's", + "start": 14.62, + "end": 15.34, + "confidence": 0.181 + }, + { + "text": "say", + "start": 15.34, + "end": 15.56, + "confidence": 0.451 + }, + { + "text": "it", + "start": 15.56, + "end": 15.76, + "confidence": 0.043 + }, + { + "text": "makes", + "start": 15.76, + "end": 15.8, + "confidence": 0.62 + }, + { + "text": "it", + "start": 15.8, + "end": 16.04, + "confidence": 0.943 + }, + { + "text": "want", + "start": 16.04, + "end": 16.22, + "confidence": 0.118 + }, + { + "text": "to", + "start": 16.22, + "end": 16.34, + "confidence": 0.953 + }, + { + "text": "go", + "start": 16.34, + "end": 16.46, + "confidence": 0.775 + }, + { + "text": "on", + "start": 16.46, + "end": 16.74, + 
"confidence": 0.939 + }, + { + "text": "the", + "start": 16.74, + "end": 16.88, + "confidence": 0.532 + }, + { + "text": "helmet", + "start": 16.88, + "end": 17.36, + "confidence": 0.003 + }, + { + "text": "we", + "start": 17.36, + "end": 17.64, + "confidence": 0.018 + }, + { + "text": "were", + "start": 17.64, + "end": 17.86, + "confidence": 0.255 + }, + { + "text": "going", + "start": 17.86, + "end": 18.06, + "confidence": 0.654 + }, + { + "text": "to", + "start": 18.06, + "end": 18.26, + "confidence": 0.966 + }, + { + "text": "have", + "start": 18.26, + "end": 18.3, + "confidence": 0.967 + }, + { + "text": "in", + "start": 18.3, + "end": 18.46, + "confidence": 0.899 + }, + { + "text": "B-1.", + "start": 18.46, + "end": 19.16, + "confidence": 0.489 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 19.4, + "end": 19.94, + "text": " The other one.", + "tokens": [ + 440, + 661, + 472, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.127, + "words": [ + { + "text": "The", + "start": 19.4, + "end": 19.44, + "confidence": 0.004 + }, + { + "text": "other", + "start": 19.44, + "end": 19.7, + "confidence": 0.144 + }, + { + "text": "one.", + "start": 19.7, + "end": 19.94, + "confidence": 0.656 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 20.12, + "end": 22.92, + "text": " And you can put the other one on the mic helmet.", + "tokens": [ + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.394, + "words": [ + { + "text": "And", + "start": 20.12, + "end": 20.26, + "confidence": 0.358 + }, + { + "text": "you", + "start": 20.26, + "end": 20.38, + "confidence": 0.915 + }, + { + "text": "can", + "start": 20.38, + "end": 20.54, + "confidence": 0.122 + }, + 
{ + "text": "put", + "start": 20.54, + "end": 20.7, + "confidence": 0.92 + }, + { + "text": "the", + "start": 20.7, + "end": 20.88, + "confidence": 0.981 + }, + { + "text": "other", + "start": 20.88, + "end": 21.06, + "confidence": 0.997 + }, + { + "text": "one", + "start": 21.06, + "end": 21.26, + "confidence": 0.97 + }, + { + "text": "on", + "start": 21.26, + "end": 22.14, + "confidence": 0.971 + }, + { + "text": "the", + "start": 22.14, + "end": 22.18, + "confidence": 0.085 + }, + { + "text": "mic", + "start": 22.18, + "end": 22.62, + "confidence": 0.679 + }, + { + "text": "helmet.", + "start": 22.62, + "end": 22.92, + "confidence": 0.085 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 22.94, + "end": 24.58, + "text": " We'll show it to you in a quick screen.", + "tokens": [ + 492, + 603, + 855, + 309, + 281, + 291, + 294, + 257, + 1702, + 2568, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.124, + "words": [ + { + "text": "We'll", + "start": 22.94, + "end": 23.32, + "confidence": 0.098 + }, + { + "text": "show", + "start": 23.32, + "end": 23.36, + "confidence": 0.008 + }, + { + "text": "it", + "start": 23.36, + "end": 23.54, + "confidence": 0.167 + }, + { + "text": "to", + "start": 23.54, + "end": 23.64, + "confidence": 0.268 + }, + { + "text": "you", + "start": 23.64, + "end": 23.8, + "confidence": 0.656 + }, + { + "text": "in", + "start": 23.8, + "end": 23.98, + "confidence": 0.246 + }, + { + "text": "a", + "start": 23.98, + "end": 24.02, + "confidence": 0.683 + }, + { + "text": "quick", + "start": 24.02, + "end": 24.14, + "confidence": 0.022 + }, + { + "text": "screen.", + "start": 24.14, + "end": 24.58, + "confidence": 0.114 + } + ] + }, + { + "id": 10, + "seek": 0, + "start": 24.94, + "end": 25.18, + "text": " Over.", + "tokens": [ + 4886, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5336953440020161, + 
"compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.45046156644821167, + "confidence": 0.117, + "words": [ + { + "text": "Over.", + "start": 24.94, + "end": 25.18, + "confidence": 0.117 + } + ] + }, + { + "id": 11, + "seek": 2600, + "start": 25.52, + "end": 27.48, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.094, + "words": [ + { + "text": "All", + "start": 25.52, + "end": 25.56, + "confidence": 0.002 + }, + { + "text": "right.", + "start": 25.56, + "end": 27.48, + "confidence": 0.622 + } + ] + }, + { + "id": 12, + "seek": 2600, + "start": 31.32, + "end": 32.12, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.045, + "words": [ + { + "text": "Yeah,", + "start": 31.32, + "end": 31.6, + "confidence": 0.032 + }, + { + "text": "sir.", + "start": 31.6, + "end": 32.12, + "confidence": 0.063 + } + ] + }, + { + "id": 13, + "seek": 2600, + "start": 32.66, + "end": 33.06, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.199, + "words": [ + { + "text": "All", + "start": 32.66, + "end": 32.94, + "confidence": 0.025 + }, + { + "text": "right.", + "start": 32.94, + "end": 33.06, + "confidence": 0.56 + } + ] + }, + { + "id": 14, + "seek": 2600, + "start": 33.08, + "end": 33.56, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.036, + "words": [ + { + 
"text": "Yeah,", + "start": 33.08, + "end": 33.38, + "confidence": 0.145 + }, + { + "text": "sir.", + "start": 33.38, + "end": 33.56, + "confidence": 0.009 + } + ] + }, + { + "id": 15, + "seek": 2600, + "start": 33.58, + "end": 35.12, + "text": " There's a better helmet than B-1.", + "tokens": [ + 821, + 311, + 257, + 1101, + 15922, + 813, + 363, + 12, + 16, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.046, + "words": [ + { + "text": "There's", + "start": 33.58, + "end": 33.96, + "confidence": 0.035 + }, + { + "text": "a", + "start": 33.96, + "end": 34.0, + "confidence": 0.302 + }, + { + "text": "better", + "start": 34.0, + "end": 34.04, + "confidence": 0.037 + }, + { + "text": "helmet", + "start": 34.04, + "end": 34.36, + "confidence": 0.009 + }, + { + "text": "than", + "start": 34.36, + "end": 34.7, + "confidence": 0.386 + }, + { + "text": "B-1.", + "start": 34.7, + "end": 35.12, + "confidence": 0.031 + } + ] + }, + { + "id": 16, + "seek": 2600, + "start": 35.14, + "end": 35.96, + "text": " That's the other one.", + "tokens": [ + 663, + 311, + 264, + 661, + 472, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.259, + "words": [ + { + "text": "That's", + "start": 35.14, + "end": 35.48, + "confidence": 0.114 + }, + { + "text": "the", + "start": 35.48, + "end": 35.52, + "confidence": 0.609 + }, + { + "text": "other", + "start": 35.52, + "end": 35.7, + "confidence": 0.954 + }, + { + "text": "one.", + "start": 35.7, + "end": 35.96, + "confidence": 0.2 + } + ] + }, + { + "id": 17, + "seek": 2600, + "start": 35.98, + "end": 36.24, + "text": " Nice.", + "tokens": [ + 5490, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 
0.0011296384036540985, + "confidence": 0.008, + "words": [ + { + "text": "Nice.", + "start": 35.98, + "end": 36.24, + "confidence": 0.008 + } + ] + }, + { + "id": 18, + "seek": 2600, + "start": 37.5, + "end": 38.44, + "text": " Let's go in there.", + "tokens": [ + 961, + 311, + 352, + 294, + 456, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.127, + "words": [ + { + "text": "Let's", + "start": 37.5, + "end": 38.16, + "confidence": 0.024 + }, + { + "text": "go", + "start": 38.16, + "end": 38.2, + "confidence": 0.624 + }, + { + "text": "in", + "start": 38.2, + "end": 38.3, + "confidence": 0.037 + }, + { + "text": "there.", + "start": 38.3, + "end": 38.44, + "confidence": 0.571 + } + ] + }, + { + "id": 19, + "seek": 2600, + "start": 38.6, + "end": 39.26, + "text": " At least we're safe.", + "tokens": [ + 1711, + 1935, + 321, + 434, + 3273, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.14, + "words": [ + { + "text": "At", + "start": 38.6, + "end": 38.64, + "confidence": 0.002 + }, + { + "text": "least", + "start": 38.64, + "end": 38.84, + "confidence": 0.269 + }, + { + "text": "we're", + "start": 38.84, + "end": 39.18, + "confidence": 0.138 + }, + { + "text": "safe.", + "start": 39.18, + "end": 39.26, + "confidence": 0.802 + } + ] + }, + { + "id": 20, + "seek": 2600, + "start": 39.92, + "end": 40.52, + "text": " We've got them in there.", + "tokens": [ + 492, + 600, + 658, + 552, + 294, + 456, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.071, + "words": [ + { + "text": "We've", + "start": 39.92, + "end": 40.36, + "confidence": 0.042 + }, + { + "text": "got", + "start": 40.36, + "end": 40.4, + 
"confidence": 0.682 + }, + { + "text": "them", + "start": 40.4, + "end": 40.44, + "confidence": 0.004 + }, + { + "text": "in", + "start": 40.44, + "end": 40.48, + "confidence": 0.041 + }, + { + "text": "there.", + "start": 40.48, + "end": 40.52, + "confidence": 0.216 + } + ] + }, + { + "id": 21, + "seek": 2600, + "start": 40.52, + "end": 41.1, + "text": " Helmet bags.", + "tokens": [ + 6128, + 5537, + 10405, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.002, + "words": [ + { + "text": "Helmet", + "start": 40.52, + "end": 40.8, + "confidence": 0.002 + }, + { + "text": "bags.", + "start": 40.8, + "end": 41.1, + "confidence": 0.002 + } + ] + }, + { + "id": 22, + "seek": 2600, + "start": 41.12, + "end": 43.1, + "text": " And, uh, I guess we have helmets in the helmet bag.", + "tokens": [ + 400, + 11, + 2232, + 11, + 286, + 2041, + 321, + 362, + 42022, + 294, + 264, + 15922, + 3411, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.036, + "words": [ + { + "text": "And,", + "start": 41.12, + "end": 41.5, + "confidence": 0.02 + }, + { + "text": "uh,", + "start": 41.5, + "end": 41.54, + "confidence": 0.55 + }, + { + "text": "I", + "start": 41.54, + "end": 41.58, + "confidence": 0.409 + }, + { + "text": "guess", + "start": 41.58, + "end": 41.64, + "confidence": 0.031 + }, + { + "text": "we", + "start": 41.64, + "end": 41.68, + "confidence": 0.059 + }, + { + "text": "have", + "start": 41.68, + "end": 41.72, + "confidence": 0.018 + }, + { + "text": "helmets", + "start": 41.72, + "end": 41.76, + "confidence": 0.0 + }, + { + "text": "in", + "start": 41.76, + "end": 42.08, + "confidence": 0.025 + }, + { + "text": "the", + "start": 42.08, + "end": 42.38, + "confidence": 0.214 + }, + { + "text": "helmet", + "start": 42.38, + "end": 
43.06, + "confidence": 0.001 + }, + { + "text": "bag.", + "start": 43.06, + "end": 43.1, + "confidence": 0.611 + } + ] + }, + { + "id": 23, + "seek": 2600, + "start": 43.56, + "end": 47.42, + "text": " At least it's in the helmet bag.", + "tokens": [ + 1711, + 1935, + 309, + 311, + 294, + 264, + 15922, + 3411, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.051, + "words": [ + { + "text": "At", + "start": 43.56, + "end": 44.06, + "confidence": 0.001 + }, + { + "text": "least", + "start": 44.06, + "end": 44.32, + "confidence": 0.325 + }, + { + "text": "it's", + "start": 44.32, + "end": 44.9, + "confidence": 0.169 + }, + { + "text": "in", + "start": 44.9, + "end": 45.46, + "confidence": 0.03 + }, + { + "text": "the", + "start": 45.46, + "end": 45.5, + "confidence": 0.345 + }, + { + "text": "helmet", + "start": 45.5, + "end": 46.54, + "confidence": 0.004 + }, + { + "text": "bag.", + "start": 46.54, + "end": 47.42, + "confidence": 0.095 + } + ] + }, + { + "id": 24, + "seek": 2600, + "start": 48.22, + "end": 48.44, + "text": " Right here.", + "tokens": [ + 1779, + 510, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.02, + "words": [ + { + "text": "Right", + "start": 48.22, + "end": 48.26, + "confidence": 0.0 + }, + { + "text": "here.", + "start": 48.26, + "end": 48.44, + "confidence": 0.167 + } + ] + }, + { + "id": 25, + "seek": 2600, + "start": 48.46, + "end": 48.76, + "text": " Right here.", + "tokens": [ + 1779, + 510, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.018, + "words": [ + { + "text": "Right", + "start": 48.46, + "end": 48.56, + "confidence": 0.001 + }, + { + "text": "here.", + "start": 
48.56, + "end": 48.76, + "confidence": 0.078 + } + ] + }, + { + "id": 26, + "seek": 2600, + "start": 48.78, + "end": 55.4, + "text": " Yeah, we're taking it next day out of the field up.", + "tokens": [ + 865, + 11, + 321, + 434, + 1940, + 309, + 958, + 786, + 484, + 295, + 264, + 2519, + 493, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5317274729410807, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011296384036540985, + "confidence": 0.285, + "words": [ + { + "text": "Yeah,", + "start": 48.78, + "end": 52.1, + "confidence": 0.124 + }, + { + "text": "we're", + "start": 52.1, + "end": 53.64, + "confidence": 0.622 + }, + { + "text": "taking", + "start": 53.64, + "end": 53.68, + "confidence": 0.352 + }, + { + "text": "it", + "start": 53.68, + "end": 53.76, + "confidence": 0.114 + }, + { + "text": "next", + "start": 53.76, + "end": 53.98, + "confidence": 0.411 + }, + { + "text": "day", + "start": 53.98, + "end": 54.2, + "confidence": 0.888 + }, + { + "text": "out", + "start": 54.2, + "end": 54.32, + "confidence": 0.322 + }, + { + "text": "of", + "start": 54.32, + "end": 54.56, + "confidence": 0.473 + }, + { + "text": "the", + "start": 54.56, + "end": 54.7, + "confidence": 0.357 + }, + { + "text": "field", + "start": 54.7, + "end": 55.2, + "confidence": 0.051 + }, + { + "text": "up.", + "start": 55.2, + "end": 55.4, + "confidence": 0.31 + } + ] + }, + { + "id": 27, + "seek": 5500, + "start": 55.42, + "end": 56.32, + "text": " Hey, we were...", + "tokens": [ + 1911, + 11, + 321, + 645, + 485 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.009, + "words": [ + { + "text": "Hey,", + "start": 55.42, + "end": 56.24, + "confidence": 0.015 + }, + { + "text": "we", + "start": 56.24, + "end": 56.28, + "confidence": 0.014 + }, + { + "text": "were...", + "start": 56.28, + "end": 56.32, + "confidence": 0.004 + } + ] + }, + { + "id": 28, 
+ "seek": 5500, + "start": 56.5, + "end": 57.52, + "text": " You want to hack me on this?", + "tokens": [ + 509, + 528, + 281, + 10339, + 385, + 322, + 341, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.022, + "words": [ + { + "text": "You", + "start": 56.5, + "end": 56.64, + "confidence": 0.006 + }, + { + "text": "want", + "start": 56.64, + "end": 57.02, + "confidence": 0.007 + }, + { + "text": "to", + "start": 57.02, + "end": 57.36, + "confidence": 0.345 + }, + { + "text": "hack", + "start": 57.36, + "end": 57.4, + "confidence": 0.0 + }, + { + "text": "me", + "start": 57.4, + "end": 57.44, + "confidence": 0.088 + }, + { + "text": "on", + "start": 57.44, + "end": 57.48, + "confidence": 0.004 + }, + { + "text": "this?", + "start": 57.48, + "end": 57.52, + "confidence": 0.177 + } + ] + }, + { + "id": 29, + "seek": 5500, + "start": 57.52, + "end": 58.44, + "text": " Hey, we were...", + "tokens": [ + 1911, + 11, + 321, + 645, + 485 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.048, + "words": [ + { + "text": "Hey,", + "start": 57.52, + "end": 57.98, + "confidence": 0.033 + }, + { + "text": "we", + "start": 57.98, + "end": 58.14, + "confidence": 0.391 + }, + { + "text": "were...", + "start": 58.14, + "end": 58.44, + "confidence": 0.024 + } + ] + }, + { + "id": 30, + "seek": 5500, + "start": 58.46, + "end": 59.44, + "text": " You want to hack me on this?", + "tokens": [ + 509, + 528, + 281, + 10339, + 385, + 322, + 341, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.04, + "words": [ + { + "text": "You", + "start": 58.46, + "end": 58.7, + "confidence": 0.014 + }, + { + "text": "want", + "start": 
58.7, + "end": 58.74, + "confidence": 0.017 + }, + { + "text": "to", + "start": 58.74, + "end": 58.78, + "confidence": 0.336 + }, + { + "text": "hack", + "start": 58.78, + "end": 58.82, + "confidence": 0.0 + }, + { + "text": "me", + "start": 58.82, + "end": 59.0, + "confidence": 0.417 + }, + { + "text": "on", + "start": 59.0, + "end": 59.2, + "confidence": 0.277 + }, + { + "text": "this?", + "start": 59.2, + "end": 59.44, + "confidence": 0.138 + } + ] + }, + { + "id": 31, + "seek": 5500, + "start": 59.76, + "end": 61.48, + "text": " With a cover, I tried it already.", + "tokens": [ + 2022, + 257, + 2060, + 11, + 286, + 3031, + 309, + 1217, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.064, + "words": [ + { + "text": "With", + "start": 59.76, + "end": 60.12, + "confidence": 0.027 + }, + { + "text": "a", + "start": 60.12, + "end": 60.84, + "confidence": 0.553 + }, + { + "text": "cover,", + "start": 60.84, + "end": 61.32, + "confidence": 0.167 + }, + { + "text": "I", + "start": 61.32, + "end": 61.36, + "confidence": 0.846 + }, + { + "text": "tried", + "start": 61.36, + "end": 61.4, + "confidence": 0.046 + }, + { + "text": "it", + "start": 61.4, + "end": 61.44, + "confidence": 0.011 + }, + { + "text": "already.", + "start": 61.44, + "end": 61.48, + "confidence": 0.01 + } + ] + }, + { + "id": 32, + "seek": 5500, + "start": 62.38, + "end": 62.46, + "text": " Okay, fine.", + "tokens": [ + 1033, + 11, + 2489, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.062, + "words": [ + { + "text": "Okay,", + "start": 62.38, + "end": 62.42, + "confidence": 0.06 + }, + { + "text": "fine.", + "start": 62.42, + "end": 62.46, + "confidence": 0.065 + } + ] + }, + { + "id": 33, + "seek": 5500, + "start": 62.56, + "end": 63.44, + "text": " 
We weren't sure of that.", + "tokens": [ + 492, + 4999, + 380, + 988, + 295, + 300, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.043, + "words": [ + { + "text": "We", + "start": 62.56, + "end": 63.06, + "confidence": 0.003 + }, + { + "text": "weren't", + "start": 63.06, + "end": 63.1, + "confidence": 0.155 + }, + { + "text": "sure", + "start": 63.1, + "end": 63.14, + "confidence": 0.01 + }, + { + "text": "of", + "start": 63.14, + "end": 63.18, + "confidence": 0.018 + }, + { + "text": "that.", + "start": 63.18, + "end": 63.44, + "confidence": 0.144 + } + ] + }, + { + "id": 34, + "seek": 5500, + "start": 63.46, + "end": 63.78, + "text": " Just a suggestion.", + "tokens": [ + 1449, + 257, + 16541, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.004, + "words": [ + { + "text": "Just", + "start": 63.46, + "end": 63.5, + "confidence": 0.003 + }, + { + "text": "a", + "start": 63.5, + "end": 63.74, + "confidence": 0.015 + }, + { + "text": "suggestion.", + "start": 63.74, + "end": 63.78, + "confidence": 0.002 + } + ] + }, + { + "id": 35, + "seek": 5500, + "start": 63.78, + "end": 65.26, + "text": " We thought we'd...", + "tokens": [ + 492, + 1194, + 321, + 1116, + 485 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.011, + "words": [ + { + "text": "We", + "start": 63.78, + "end": 64.9, + "confidence": 0.003 + }, + { + "text": "thought", + "start": 64.9, + "end": 65.2, + "confidence": 0.001 + }, + { + "text": "we'd...", + "start": 65.2, + "end": 65.26, + "confidence": 0.036 + } + ] + }, + { + "id": 36, + "seek": 5500, + "start": 66.26, + "end": 66.46, + "text": " You could check it out.", + "tokens": [ + 
509, + 727, + 1520, + 309, + 484, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.03, + "words": [ + { + "text": "You", + "start": 66.26, + "end": 66.3, + "confidence": 0.004 + }, + { + "text": "could", + "start": 66.3, + "end": 66.34, + "confidence": 0.002 + }, + { + "text": "check", + "start": 66.34, + "end": 66.38, + "confidence": 0.003 + }, + { + "text": "it", + "start": 66.38, + "end": 66.42, + "confidence": 0.16 + }, + { + "text": "out.", + "start": 66.42, + "end": 66.46, + "confidence": 0.442 + } + ] + }, + { + "id": 37, + "seek": 5500, + "start": 66.82, + "end": 69.34, + "text": " It's not much of an order to turn that.", + "tokens": [ + 467, + 311, + 406, + 709, + 295, + 364, + 1668, + 281, + 1261, + 300, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.136, + "words": [ + { + "text": "It's", + "start": 66.82, + "end": 67.32, + "confidence": 0.035 + }, + { + "text": "not", + "start": 67.32, + "end": 68.36, + "confidence": 0.025 + }, + { + "text": "much", + "start": 68.36, + "end": 68.62, + "confidence": 0.683 + }, + { + "text": "of", + "start": 68.62, + "end": 68.8, + "confidence": 0.59 + }, + { + "text": "an", + "start": 68.8, + "end": 68.86, + "confidence": 0.137 + }, + { + "text": "order", + "start": 68.86, + "end": 68.96, + "confidence": 0.142 + }, + { + "text": "to", + "start": 68.96, + "end": 69.16, + "confidence": 0.043 + }, + { + "text": "turn", + "start": 69.16, + "end": 69.2, + "confidence": 0.1 + }, + { + "text": "that.", + "start": 69.2, + "end": 69.34, + "confidence": 0.536 + } + ] + }, + { + "id": 38, + "seek": 5500, + "start": 70.32, + "end": 72.02, + "text": " So, uh, I guess we're going to come up with this.", + "tokens": [ + 407, + 11, + 2232, + 11, + 286, + 2041, + 321, + 434, + 516, + 
281, + 808, + 493, + 365, + 341, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.495, + "words": [ + { + "text": "So,", + "start": 70.32, + "end": 70.36, + "confidence": 0.528 + }, + { + "text": "uh,", + "start": 70.36, + "end": 70.5, + "confidence": 0.497 + }, + { + "text": "I", + "start": 70.5, + "end": 70.54, + "confidence": 0.958 + }, + { + "text": "guess", + "start": 70.54, + "end": 70.84, + "confidence": 0.986 + }, + { + "text": "we're", + "start": 70.84, + "end": 71.12, + "confidence": 0.504 + }, + { + "text": "going", + "start": 71.12, + "end": 71.3, + "confidence": 0.143 + }, + { + "text": "to", + "start": 71.3, + "end": 71.48, + "confidence": 0.956 + }, + { + "text": "come", + "start": 71.48, + "end": 71.52, + "confidence": 0.547 + }, + { + "text": "up", + "start": 71.52, + "end": 71.7, + "confidence": 0.796 + }, + { + "text": "with", + "start": 71.7, + "end": 71.88, + "confidence": 0.807 + }, + { + "text": "this.", + "start": 71.88, + "end": 72.02, + "confidence": 0.181 + } + ] + }, + { + "id": 39, + "seek": 5500, + "start": 72.04, + "end": 72.52, + "text": " Let us know.", + "tokens": [ + 961, + 505, + 458, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.323, + "words": [ + { + "text": "Let", + "start": 72.04, + "end": 72.14, + "confidence": 0.076 + }, + { + "text": "us", + "start": 72.14, + "end": 72.34, + "confidence": 0.304 + }, + { + "text": "know.", + "start": 72.34, + "end": 72.52, + "confidence": 0.686 + } + ] + }, + { + "id": 40, + "seek": 5500, + "start": 72.54, + "end": 72.7, + "text": " Okay.", + "tokens": [ + 1033, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.026, 
+ "words": [ + { + "text": "Okay.", + "start": 72.54, + "end": 72.7, + "confidence": 0.026 + } + ] + }, + { + "id": 41, + "seek": 5500, + "start": 74.2, + "end": 75.16, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.082, + "words": [ + { + "text": "No", + "start": 74.2, + "end": 74.42, + "confidence": 0.004 + }, + { + "text": "problem.", + "start": 74.42, + "end": 75.16, + "confidence": 0.351 + } + ] + }, + { + "id": 42, + "seek": 5500, + "start": 75.18, + "end": 75.9, + "text": " Okay.", + "tokens": [ + 1033, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.237, + "words": [ + { + "text": "Okay.", + "start": 75.18, + "end": 75.9, + "confidence": 0.237 + } + ] + }, + { + "id": 43, + "seek": 5500, + "start": 75.92, + "end": 76.64, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.56, + "words": [ + { + "text": "No", + "start": 75.92, + "end": 76.22, + "confidence": 0.366 + }, + { + "text": "problem.", + "start": 76.22, + "end": 76.64, + "confidence": 0.692 + } + ] + }, + { + "id": 44, + "seek": 5500, + "start": 76.66, + "end": 78.1, + "text": " We'll let you know when the end of...", + "tokens": [ + 492, + 603, + 718, + 291, + 458, + 562, + 264, + 917, + 295, + 485 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.367, + "words": [ + { + "text": "We'll", + "start": 76.66, + "end": 76.82, + "confidence": 0.091 + }, + { + "text": "let", + "start": 76.82, + "end": 77.04, 
+ "confidence": 0.723 + }, + { + "text": "you", + "start": 77.04, + "end": 77.18, + "confidence": 0.296 + }, + { + "text": "know", + "start": 77.18, + "end": 77.26, + "confidence": 0.984 + }, + { + "text": "when", + "start": 77.26, + "end": 77.38, + "confidence": 0.596 + }, + { + "text": "the", + "start": 77.38, + "end": 77.44, + "confidence": 0.683 + }, + { + "text": "end", + "start": 77.44, + "end": 77.56, + "confidence": 0.937 + }, + { + "text": "of...", + "start": 77.56, + "end": 78.1, + "confidence": 0.257 + } + ] + }, + { + "id": 45, + "seek": 5500, + "start": 78.12, + "end": 78.34, + "text": " None.", + "tokens": [ + 14492, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.32385124256408293, + "compression_ratio": 1.7088607594936709, + "no_speech_prob": 0.0003275917551945895, + "confidence": 0.017, + "words": [ + { + "text": "None.", + "start": 78.12, + "end": 78.34, + "confidence": 0.017 + } + ] + }, + { + "id": 46, + "seek": 7900, + "start": 78.52, + "end": 82.18, + "text": " Okay.", + "tokens": [ + 50364, + 1033, + 13, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.7262506484985352, + "compression_ratio": 0.38461538461538464, + "no_speech_prob": 0.0013847488444298506, + "confidence": 0.036, + "words": [ + { + "text": "Okay.", + "start": 78.52, + "end": 82.18, + "confidence": 0.036 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/naive.cpu/naive_apollo11.mp3.words.json b/tests/expected/naive.cpu/naive_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..e4eef5136cb849167d2c3d19c38438515c0e4232 --- /dev/null +++ b/tests/expected/naive.cpu/naive_apollo11.mp3.words.json @@ -0,0 +1,3814 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA. Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1. And you can put the other one on the mic helmet with those GVA blizzard frames. 
Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, 
got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.64, + "end": 6.68, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 20914, + 460, + 2634, + 15454, + 460, + 20914, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7224321867290296, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.49, + "words": [ + { + "text": "Apollo", + "start": 0.64, + "end": 0.98, + "confidence": 0.426 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.54, + "confidence": 0.842 + }, + { + "text": "Houston", + "start": 1.54, + "end": 1.8, + "confidence": 0.974 + }, + { + "text": "we", + "start": 1.8, + "end": 1.98, + "confidence": 0.453 + }, + { + "text": "got", + "start": 1.98, + "end": 2.16, + "confidence": 0.789 + }, + { + "text": "a", + "start": 2.16, + "end": 2.36, + "confidence": 0.992 + }, + { + "text": "recommendation", + "start": 2.36, + "end": 3.1, + "confidence": 0.971 + }, + { + "text": "for", + "start": 3.1, + "end": 3.54, + "confidence": 0.944 + }, + { + "text": "you", + "start": 3.54, + "end": 3.88, + "confidence": 0.99 + }, + { + "text": "on", + "start": 3.88, + "end": 4.26, + "confidence": 0.935 + }, + { + "text": "your", + "start": 4.26, + "end": 4.3, + "confidence": 0.974 + }, + { + "text": "Soyuz-VA", + "start": 4.3, + "end": 5.38, + "confidence": 0.325 + }, + { + "text": "GLEME", + "start": 5.38, + "end": 6.02, + "confidence": 0.171 + }, + { + "text": "GVA.", + "start": 6.02, + "end": 6.68, + "confidence": 0.318 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 6.7, + "end": 19.16, + "text": " Alright, okay, we 
like to say that they make the one that's on the helmet we're going to have in B1.", + "tokens": [ + 2798, + 11, + 1392, + 11, + 321, + 411, + 281, + 584, + 300, + 436, + 652, + 264, + 472, + 300, + 311, + 322, + 264, + 15922, + 321, + 434, + 516, + 281, + 362, + 294, + 363, + 16, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7224321867290296, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.324, + "words": [ + { + "text": "Alright,", + "start": 6.7, + "end": 12.02, + "confidence": 0.083 + }, + { + "text": "okay,", + "start": 12.02, + "end": 12.82, + "confidence": 0.321 + }, + { + "text": "we", + "start": 12.82, + "end": 13.04, + "confidence": 0.365 + }, + { + "text": "like", + "start": 13.04, + "end": 13.5, + "confidence": 0.475 + }, + { + "text": "to", + "start": 13.5, + "end": 13.68, + "confidence": 0.124 + }, + { + "text": "say", + "start": 13.68, + "end": 14.98, + "confidence": 0.127 + }, + { + "text": "that", + "start": 14.98, + "end": 15.56, + "confidence": 0.244 + }, + { + "text": "they", + "start": 15.56, + "end": 15.6, + "confidence": 0.387 + }, + { + "text": "make", + "start": 15.6, + "end": 15.78, + "confidence": 0.155 + }, + { + "text": "the", + "start": 15.78, + "end": 15.92, + "confidence": 0.172 + }, + { + "text": "one", + "start": 15.92, + "end": 16.1, + "confidence": 0.507 + }, + { + "text": "that's", + "start": 16.1, + "end": 16.36, + "confidence": 0.385 + }, + { + "text": "on", + "start": 16.36, + "end": 16.6, + "confidence": 0.324 + }, + { + "text": "the", + "start": 16.6, + "end": 16.84, + "confidence": 0.35 + }, + { + "text": "helmet", + "start": 16.84, + "end": 17.36, + "confidence": 0.218 + }, + { + "text": "we're", + "start": 17.36, + "end": 17.86, + "confidence": 0.361 + }, + { + "text": "going", + "start": 17.86, + "end": 18.06, + "confidence": 0.435 + }, + { + "text": "to", + "start": 18.06, + "end": 18.22, + "confidence": 0.496 + }, + { + "text": "have", + "start": 18.22, + 
"end": 18.26, + "confidence": 0.831 + }, + { + "text": "in", + "start": 18.26, + "end": 18.48, + "confidence": 0.761 + }, + { + "text": "B1.", + "start": 18.48, + "end": 19.16, + "confidence": 0.731 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 20.12, + "end": 24.64, + "text": " And you can put the other one on the mic helmet with those GVA blizzard frames.", + "tokens": [ + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 888, + 31062, + 12083, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7224321867290296, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.45045843720436096, + "confidence": 0.119, + "words": [ + { + "text": "And", + "start": 20.12, + "end": 20.16, + "confidence": 0.27 + }, + { + "text": "you", + "start": 20.16, + "end": 20.36, + "confidence": 0.884 + }, + { + "text": "can", + "start": 20.36, + "end": 20.54, + "confidence": 0.388 + }, + { + "text": "put", + "start": 20.54, + "end": 20.72, + "confidence": 0.929 + }, + { + "text": "the", + "start": 20.72, + "end": 20.9, + "confidence": 0.98 + }, + { + "text": "other", + "start": 20.9, + "end": 21.06, + "confidence": 0.995 + }, + { + "text": "one", + "start": 21.06, + "end": 21.26, + "confidence": 0.964 + }, + { + "text": "on", + "start": 21.26, + "end": 21.8, + "confidence": 0.962 + }, + { + "text": "the", + "start": 21.8, + "end": 21.84, + "confidence": 0.185 + }, + { + "text": "mic", + "start": 21.84, + "end": 22.6, + "confidence": 0.682 + }, + { + "text": "helmet", + "start": 22.6, + "end": 22.96, + "confidence": 0.011 + }, + { + "text": "with", + "start": 22.96, + "end": 23.2, + "confidence": 0.055 + }, + { + "text": "those", + "start": 23.2, + "end": 23.46, + "confidence": 0.084 + }, + { + "text": "GVA", + "start": 23.46, + "end": 23.88, + "confidence": 0.0 + }, + { + "text": "blizzard", + "start": 23.88, + "end": 24.36, + "confidence": 0.026 + }, + { + "text": "frames.", + "start": 24.36, + "end": 24.64, + 
"confidence": 0.179 + } + ] + }, + { + "id": 3, + "seek": 2500, + "start": 24.86, + "end": 54.62, + "text": " Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 2798, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 
658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.1079042222764757, + "compression_ratio": 24.096774193548388, + "no_speech_prob": 0.00111382023897022, + "confidence": 0.887, + "words": [ + { + "text": "Alright,", + "start": 24.86, + "end": 32.0, + "confidence": 0.092 + }, + { + "text": "got", + "start": 32.0, + "end": 32.04, + "confidence": 0.107 + }, + { + "text": "them,", + "start": 32.04, + "end": 32.58, + "confidence": 0.194 + }, + { + "text": "got", + "start": 32.58, + "end": 33.06, + "confidence": 0.39 + }, + { + "text": "them,", + "start": 33.06, + "end": 33.78, + "confidence": 0.616 + }, + { + "text": "got", + "start": 33.78, + "end": 33.82, + "confidence": 0.641 + }, + { + "text": "them,", + "start": 33.82, + "end": 34.52, + "confidence": 0.506 + }, + { + "text": "got", + "start": 34.52, + "end": 34.74, + "confidence": 0.662 + }, + { + "text": "them,", + "start": 34.74, + "end": 34.78, + "confidence": 0.507 + }, + { + "text": "got", + "start": 34.78, + "end": 35.02, + "confidence": 0.754 + }, + { + "text": "them,", + "start": 35.02, + "end": 35.06, + "confidence": 0.589 + }, + { + "text": "got", + "start": 35.06, + "end": 35.1, + "confidence": 0.779 + }, + { + "text": "them,", + "start": 35.1, + "end": 35.14, + "confidence": 0.705 + }, + { + "text": "got", + "start": 35.14, + "end": 35.34, + "confidence": 0.86 + }, + { + "text": "them,", + "start": 35.34, + "end": 35.98, + "confidence": 0.82 + }, + { + "text": "got", + "start": 35.98, + "end": 36.02, + "confidence": 0.916 + }, + { + "text": "them,", + "start": 36.02, + "end": 36.06, + "confidence": 0.76 + }, + { + "text": "got", + "start": 
36.06, + "end": 36.1, + "confidence": 0.479 + }, + { + "text": "them,", + "start": 36.1, + "end": 36.14, + "confidence": 0.846 + }, + { + "text": "got", + "start": 36.14, + "end": 36.18, + "confidence": 0.916 + }, + { + "text": "them,", + "start": 36.18, + "end": 36.22, + "confidence": 0.89 + }, + { + "text": "got", + "start": 36.22, + "end": 36.26, + "confidence": 0.928 + }, + { + "text": "them,", + "start": 36.26, + "end": 36.3, + "confidence": 0.903 + }, + { + "text": "got", + "start": 36.3, + "end": 36.34, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 36.34, + "end": 36.38, + "confidence": 0.91 + }, + { + "text": "got", + "start": 36.38, + "end": 36.42, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 36.42, + "end": 36.46, + "confidence": 0.904 + }, + { + "text": "got", + "start": 36.46, + "end": 36.5, + "confidence": 0.942 + }, + { + "text": "them,", + "start": 36.5, + "end": 36.54, + "confidence": 0.903 + }, + { + "text": "got", + "start": 36.54, + "end": 36.58, + "confidence": 0.935 + }, + { + "text": "them,", + "start": 36.58, + "end": 36.62, + "confidence": 0.912 + }, + { + "text": "got", + "start": 36.62, + "end": 36.66, + "confidence": 0.93 + }, + { + "text": "them,", + "start": 36.66, + "end": 36.7, + "confidence": 0.918 + }, + { + "text": "got", + "start": 36.7, + "end": 36.74, + "confidence": 0.93 + }, + { + "text": "them,", + "start": 36.74, + "end": 36.78, + "confidence": 0.923 + }, + { + "text": "got", + "start": 36.78, + "end": 36.82, + "confidence": 0.936 + }, + { + "text": "them,", + "start": 36.82, + "end": 36.86, + "confidence": 0.93 + }, + { + "text": "got", + "start": 36.86, + "end": 36.9, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 36.9, + "end": 36.94, + "confidence": 0.937 + }, + { + "text": "got", + "start": 36.94, + "end": 36.98, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 36.98, + "end": 37.02, + "confidence": 0.942 + }, + { + "text": "got", + "start": 37.02, + "end": 37.06, 
+ "confidence": 0.946 + }, + { + "text": "them,", + "start": 37.06, + "end": 37.1, + "confidence": 0.945 + }, + { + "text": "got", + "start": 37.1, + "end": 37.14, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 37.14, + "end": 37.18, + "confidence": 0.948 + }, + { + "text": "got", + "start": 37.18, + "end": 37.22, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 37.22, + "end": 37.26, + "confidence": 0.951 + }, + { + "text": "got", + "start": 37.26, + "end": 37.3, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 37.3, + "end": 37.34, + "confidence": 0.953 + }, + { + "text": "got", + "start": 37.34, + "end": 37.38, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 37.38, + "end": 37.42, + "confidence": 0.956 + }, + { + "text": "got", + "start": 37.42, + "end": 37.46, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 37.46, + "end": 37.5, + "confidence": 0.957 + }, + { + "text": "got", + "start": 37.5, + "end": 37.54, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 37.54, + "end": 37.58, + "confidence": 0.958 + }, + { + "text": "got", + "start": 37.58, + "end": 37.62, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 37.62, + "end": 37.66, + "confidence": 0.961 + }, + { + "text": "got", + "start": 37.66, + "end": 37.7, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 37.7, + "end": 37.74, + "confidence": 0.961 + }, + { + "text": "got", + "start": 37.74, + "end": 37.78, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 37.78, + "end": 37.82, + "confidence": 0.962 + }, + { + "text": "got", + "start": 37.82, + "end": 37.86, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 37.86, + "end": 37.9, + "confidence": 0.964 + }, + { + "text": "got", + "start": 37.9, + "end": 37.94, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 37.94, + "end": 37.98, + "confidence": 0.965 + }, + { + "text": "got", + "start": 37.98, + "end": 38.02, + "confidence": 
0.959 + }, + { + "text": "them,", + "start": 38.02, + "end": 38.06, + "confidence": 0.966 + }, + { + "text": "got", + "start": 38.06, + "end": 38.1, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 38.1, + "end": 38.14, + "confidence": 0.968 + }, + { + "text": "got", + "start": 38.14, + "end": 38.18, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 38.18, + "end": 38.22, + "confidence": 0.969 + }, + { + "text": "got", + "start": 38.22, + "end": 38.26, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 38.26, + "end": 38.3, + "confidence": 0.968 + }, + { + "text": "got", + "start": 38.3, + "end": 38.34, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 38.34, + "end": 38.38, + "confidence": 0.971 + }, + { + "text": "got", + "start": 38.38, + "end": 38.42, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 38.42, + "end": 38.46, + "confidence": 0.972 + }, + { + "text": "got", + "start": 38.46, + "end": 38.5, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 38.5, + "end": 38.54, + "confidence": 0.974 + }, + { + "text": "got", + "start": 38.54, + "end": 38.58, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 38.58, + "end": 38.62, + "confidence": 0.974 + }, + { + "text": "got", + "start": 38.62, + "end": 38.66, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 38.66, + "end": 38.7, + "confidence": 0.974 + }, + { + "text": "got", + "start": 38.7, + "end": 38.74, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 38.74, + "end": 38.78, + "confidence": 0.976 + }, + { + "text": "got", + "start": 38.78, + "end": 38.82, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 38.82, + "end": 38.86, + "confidence": 0.977 + }, + { + "text": "got", + "start": 38.86, + "end": 38.9, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 38.9, + "end": 38.94, + "confidence": 0.978 + }, + { + "text": "got", + "start": 38.94, + "end": 38.98, + "confidence": 0.978 + }, + { + 
"text": "them,", + "start": 38.98, + "end": 39.02, + "confidence": 0.978 + }, + { + "text": "got", + "start": 39.02, + "end": 39.06, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 39.06, + "end": 39.1, + "confidence": 0.979 + }, + { + "text": "got", + "start": 39.1, + "end": 39.14, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 39.14, + "end": 39.18, + "confidence": 0.981 + }, + { + "text": "got", + "start": 39.18, + "end": 39.22, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 39.22, + "end": 39.26, + "confidence": 0.982 + }, + { + "text": "got", + "start": 39.26, + "end": 39.3, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 39.3, + "end": 39.34, + "confidence": 0.982 + }, + { + "text": "got", + "start": 39.34, + "end": 39.38, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 39.38, + "end": 39.42, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.42, + "end": 39.46, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 39.46, + "end": 39.5, + "confidence": 0.982 + }, + { + "text": "got", + "start": 39.5, + "end": 39.54, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.54, + "end": 39.58, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.58, + "end": 39.62, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.62, + "end": 39.66, + "confidence": 0.984 + }, + { + "text": "got", + "start": 39.66, + "end": 39.7, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.7, + "end": 39.74, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.74, + "end": 39.78, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.78, + "end": 39.82, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.82, + "end": 39.86, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.86, + "end": 39.9, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.9, + "end": 39.94, + "confidence": 0.992 + }, + { + "text": "them,", + 
"start": 39.94, + "end": 39.98, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.98, + "end": 40.02, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.02, + "end": 40.06, + "confidence": 0.986 + }, + { + "text": "got", + "start": 40.06, + "end": 40.1, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.1, + "end": 40.14, + "confidence": 0.986 + }, + { + "text": "got", + "start": 40.14, + "end": 40.18, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.18, + "end": 40.22, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.22, + "end": 40.26, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.26, + "end": 40.3, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.3, + "end": 40.34, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.34, + "end": 40.38, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.38, + "end": 40.42, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.42, + "end": 40.46, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.46, + "end": 40.5, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.5, + "end": 40.54, + "confidence": 0.986 + }, + { + "text": "got", + "start": 40.54, + "end": 40.58, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 40.58, + "end": 40.76, + "confidence": 0.988 + }, + { + "text": "got", + "start": 40.76, + "end": 40.8, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.8, + "end": 40.84, + "confidence": 0.988 + }, + { + "text": "got", + "start": 40.84, + "end": 40.88, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 40.88, + "end": 40.92, + "confidence": 0.989 + }, + { + "text": "got", + "start": 40.92, + "end": 40.96, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 40.96, + "end": 41.0, + "confidence": 0.989 + }, + { + "text": "got", + "start": 41.0, + "end": 41.04, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 41.04, + 
"end": 41.08, + "confidence": 0.989 + }, + { + "text": "got", + "start": 41.08, + "end": 41.12, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 41.12, + "end": 42.32, + "confidence": 0.989 + }, + { + "text": "got", + "start": 42.32, + "end": 42.68, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 42.68, + "end": 42.9, + "confidence": 0.989 + }, + { + "text": "got", + "start": 42.9, + "end": 44.08, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 44.08, + "end": 44.96, + "confidence": 0.989 + }, + { + "text": "got", + "start": 44.96, + "end": 46.9, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 46.9, + "end": 47.82, + "confidence": 0.989 + }, + { + "text": "got", + "start": 47.82, + "end": 48.56, + "confidence": 0.994 + }, + { + "text": "them", + "start": 48.56, + "end": 54.62, + "confidence": 0.996 + } + ] + }, + { + "id": 4, + "seek": 5500, + "start": 54.64, + "end": 84.6, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 
658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.053046889369263245, + "compression_ratio": 29.52, + "no_speech_prob": 0.24410122632980347, + "confidence": 0.839, + "words": [ + { + "text": "got", + "start": 54.64, + "end": 54.82, + "confidence": 0.004 + }, + { + "text": "them,", + "start": 54.82, + "end": 56.36, + "confidence": 0.007 + }, + { + "text": "got", + "start": 56.36, + "end": 58.46, + "confidence": 0.037 + }, + { + "text": "them,", + "start": 58.46, + "end": 59.7, + "confidence": 0.349 + }, + { + "text": "got", + "start": 59.7, + "end": 60.0, + "confidence": 0.616 + }, + { + "text": "them,", + "start": 60.0, + "end": 60.04, + "confidence": 0.574 + }, + { + "text": "got", + "start": 60.04, + "end": 60.08, + "confidence": 0.808 + }, + { + "text": "them,", + "start": 60.08, + "end": 60.12, + 
"confidence": 0.636 + }, + { + "text": "got", + "start": 60.12, + "end": 60.16, + "confidence": 0.875 + }, + { + "text": "them,", + "start": 60.16, + "end": 60.2, + "confidence": 0.676 + }, + { + "text": "got", + "start": 60.2, + "end": 60.24, + "confidence": 0.9 + }, + { + "text": "them,", + "start": 60.24, + "end": 60.42, + "confidence": 0.689 + }, + { + "text": "got", + "start": 60.42, + "end": 60.46, + "confidence": 0.871 + }, + { + "text": "them,", + "start": 60.46, + "end": 60.5, + "confidence": 0.757 + }, + { + "text": "got", + "start": 60.5, + "end": 60.62, + "confidence": 0.904 + }, + { + "text": "them,", + "start": 60.62, + "end": 61.78, + "confidence": 0.825 + }, + { + "text": "got", + "start": 61.78, + "end": 61.82, + "confidence": 0.926 + }, + { + "text": "them,", + "start": 61.82, + "end": 61.86, + "confidence": 0.58 + }, + { + "text": "got", + "start": 61.86, + "end": 61.9, + "confidence": 0.123 + }, + { + "text": "them,", + "start": 61.9, + "end": 61.94, + "confidence": 0.75 + }, + { + "text": "got", + "start": 61.94, + "end": 61.98, + "confidence": 0.772 + }, + { + "text": "them,", + "start": 61.98, + "end": 62.02, + "confidence": 0.81 + }, + { + "text": "got", + "start": 62.02, + "end": 62.06, + "confidence": 0.808 + }, + { + "text": "them,", + "start": 62.06, + "end": 62.1, + "confidence": 0.828 + }, + { + "text": "got", + "start": 62.1, + "end": 62.14, + "confidence": 0.82 + }, + { + "text": "them,", + "start": 62.14, + "end": 62.18, + "confidence": 0.852 + }, + { + "text": "got", + "start": 62.18, + "end": 62.22, + "confidence": 0.858 + }, + { + "text": "them,", + "start": 62.22, + "end": 62.26, + "confidence": 0.886 + }, + { + "text": "got", + "start": 62.26, + "end": 62.3, + "confidence": 0.899 + }, + { + "text": "them,", + "start": 62.3, + "end": 62.34, + "confidence": 0.901 + }, + { + "text": "got", + "start": 62.34, + "end": 62.38, + "confidence": 0.89 + }, + { + "text": "them,", + "start": 62.38, + "end": 62.42, + "confidence": 0.905 + }, 
+ { + "text": "got", + "start": 62.42, + "end": 62.46, + "confidence": 0.868 + }, + { + "text": "them,", + "start": 62.46, + "end": 62.5, + "confidence": 0.919 + }, + { + "text": "got", + "start": 62.5, + "end": 62.54, + "confidence": 0.881 + }, + { + "text": "them,", + "start": 62.54, + "end": 62.58, + "confidence": 0.929 + }, + { + "text": "got", + "start": 62.58, + "end": 62.62, + "confidence": 0.893 + }, + { + "text": "them,", + "start": 62.62, + "end": 62.66, + "confidence": 0.938 + }, + { + "text": "got", + "start": 62.66, + "end": 62.7, + "confidence": 0.906 + }, + { + "text": "them,", + "start": 62.7, + "end": 62.74, + "confidence": 0.943 + }, + { + "text": "got", + "start": 62.74, + "end": 62.78, + "confidence": 0.913 + }, + { + "text": "them,", + "start": 62.78, + "end": 62.82, + "confidence": 0.949 + }, + { + "text": "got", + "start": 62.82, + "end": 62.86, + "confidence": 0.919 + }, + { + "text": "them,", + "start": 62.86, + "end": 62.9, + "confidence": 0.952 + }, + { + "text": "got", + "start": 62.9, + "end": 62.94, + "confidence": 0.926 + }, + { + "text": "them,", + "start": 62.94, + "end": 62.98, + "confidence": 0.956 + }, + { + "text": "got", + "start": 62.98, + "end": 63.02, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 63.02, + "end": 63.06, + "confidence": 0.958 + }, + { + "text": "got", + "start": 63.06, + "end": 63.1, + "confidence": 0.936 + }, + { + "text": "them,", + "start": 63.1, + "end": 63.14, + "confidence": 0.961 + }, + { + "text": "got", + "start": 63.14, + "end": 63.18, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 63.18, + "end": 63.22, + "confidence": 0.964 + }, + { + "text": "got", + "start": 63.22, + "end": 63.26, + "confidence": 0.939 + }, + { + "text": "them,", + "start": 63.26, + "end": 63.3, + "confidence": 0.964 + }, + { + "text": "got", + "start": 63.3, + "end": 63.34, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 63.34, + "end": 63.38, + "confidence": 0.965 + }, + { + "text": 
"got", + "start": 63.38, + "end": 63.42, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 63.42, + "end": 63.46, + "confidence": 0.967 + }, + { + "text": "got", + "start": 63.46, + "end": 63.5, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 63.5, + "end": 63.54, + "confidence": 0.968 + }, + { + "text": "got", + "start": 63.54, + "end": 63.58, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 63.58, + "end": 63.62, + "confidence": 0.968 + }, + { + "text": "got", + "start": 63.62, + "end": 63.66, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 63.66, + "end": 63.7, + "confidence": 0.97 + }, + { + "text": "got", + "start": 63.7, + "end": 63.74, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 63.74, + "end": 63.78, + "confidence": 0.971 + }, + { + "text": "got", + "start": 63.78, + "end": 63.82, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 63.82, + "end": 63.86, + "confidence": 0.971 + }, + { + "text": "got", + "start": 63.86, + "end": 63.9, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 63.9, + "end": 63.94, + "confidence": 0.971 + }, + { + "text": "got", + "start": 63.94, + "end": 63.98, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 63.98, + "end": 64.02, + "confidence": 0.97 + }, + { + "text": "got", + "start": 64.02, + "end": 64.06, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 64.06, + "end": 64.1, + "confidence": 0.972 + }, + { + "text": "got", + "start": 64.1, + "end": 64.14, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 64.14, + "end": 64.18, + "confidence": 0.972 + }, + { + "text": "got", + "start": 64.18, + "end": 64.22, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 64.22, + "end": 64.26, + "confidence": 0.973 + }, + { + "text": "got", + "start": 64.26, + "end": 64.3, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 64.3, + "end": 64.34, + "confidence": 0.974 + }, + { + "text": "got", + "start": 
64.34, + "end": 64.38, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 64.38, + "end": 64.42, + "confidence": 0.974 + }, + { + "text": "got", + "start": 64.42, + "end": 64.46, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 64.46, + "end": 64.5, + "confidence": 0.974 + }, + { + "text": "got", + "start": 64.5, + "end": 64.54, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 64.54, + "end": 64.58, + "confidence": 0.974 + }, + { + "text": "got", + "start": 64.58, + "end": 64.62, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 64.62, + "end": 64.66, + "confidence": 0.975 + }, + { + "text": "got", + "start": 64.66, + "end": 64.7, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 64.7, + "end": 64.74, + "confidence": 0.975 + }, + { + "text": "got", + "start": 64.74, + "end": 64.78, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 64.78, + "end": 64.82, + "confidence": 0.977 + }, + { + "text": "got", + "start": 64.82, + "end": 64.86, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 64.86, + "end": 64.9, + "confidence": 0.977 + }, + { + "text": "got", + "start": 64.9, + "end": 64.94, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 64.94, + "end": 64.98, + "confidence": 0.976 + }, + { + "text": "got", + "start": 64.98, + "end": 65.02, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 65.02, + "end": 65.06, + "confidence": 0.976 + }, + { + "text": "got", + "start": 65.06, + "end": 65.1, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 65.1, + "end": 65.14, + "confidence": 0.978 + }, + { + "text": "got", + "start": 65.14, + "end": 65.18, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 65.18, + "end": 65.22, + "confidence": 0.978 + }, + { + "text": "got", + "start": 65.22, + "end": 65.26, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 65.26, + "end": 65.3, + "confidence": 0.979 + }, + { + "text": "got", + "start": 65.3, + "end": 
65.34, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 65.34, + "end": 65.38, + "confidence": 0.979 + }, + { + "text": "got", + "start": 65.38, + "end": 65.42, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 65.42, + "end": 65.46, + "confidence": 0.978 + }, + { + "text": "got", + "start": 65.46, + "end": 65.5, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 65.5, + "end": 65.54, + "confidence": 0.98 + }, + { + "text": "got", + "start": 65.54, + "end": 65.58, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 65.58, + "end": 65.62, + "confidence": 0.979 + }, + { + "text": "got", + "start": 65.62, + "end": 65.66, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 65.66, + "end": 65.7, + "confidence": 0.98 + }, + { + "text": "got", + "start": 65.7, + "end": 65.74, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 65.74, + "end": 65.78, + "confidence": 0.98 + }, + { + "text": "got", + "start": 65.78, + "end": 65.82, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 65.82, + "end": 65.86, + "confidence": 0.981 + }, + { + "text": "got", + "start": 65.86, + "end": 65.9, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 65.9, + "end": 65.94, + "confidence": 0.98 + }, + { + "text": "got", + "start": 65.94, + "end": 65.98, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 65.98, + "end": 66.02, + "confidence": 0.982 + }, + { + "text": "got", + "start": 66.02, + "end": 66.3, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 66.3, + "end": 66.34, + "confidence": 0.982 + }, + { + "text": "got", + "start": 66.34, + "end": 66.54, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 66.54, + "end": 66.58, + "confidence": 0.982 + }, + { + "text": "got", + "start": 66.58, + "end": 66.62, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 66.62, + "end": 66.66, + "confidence": 0.981 + }, + { + "text": "got", + "start": 66.66, + "end": 67.38, + 
"confidence": 0.989 + }, + { + "text": "them,", + "start": 67.38, + "end": 67.42, + "confidence": 0.982 + }, + { + "text": "got", + "start": 67.42, + "end": 67.46, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 67.46, + "end": 67.5, + "confidence": 0.982 + }, + { + "text": "got", + "start": 67.5, + "end": 67.54, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 67.54, + "end": 67.72, + "confidence": 0.983 + }, + { + "text": "got", + "start": 67.72, + "end": 67.76, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 67.76, + "end": 67.8, + "confidence": 0.984 + }, + { + "text": "got", + "start": 67.8, + "end": 68.9, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 68.9, + "end": 69.8, + "confidence": 0.983 + }, + { + "text": "got", + "start": 69.8, + "end": 70.66, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 70.66, + "end": 70.94, + "confidence": 0.985 + }, + { + "text": "got", + "start": 70.94, + "end": 71.08, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 71.08, + "end": 72.02, + "confidence": 0.984 + }, + { + "text": "got", + "start": 72.02, + "end": 72.08, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 72.08, + "end": 72.84, + "confidence": 0.984 + }, + { + "text": "got", + "start": 72.84, + "end": 77.32, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 77.32, + "end": 79.8, + "confidence": 0.985 + }, + { + "text": "got", + "start": 79.8, + "end": 79.84, + "confidence": 0.992 + }, + { + "text": "them", + "start": 79.84, + "end": 84.6, + "confidence": 0.994 + } + ] + }, + { + "id": 5, + "seek": 8500, + "start": 85.24, + "end": 91.16, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got 
them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.04965524716227578, + 
"compression_ratio": 29.52, + "no_speech_prob": 0.6971923112869263, + "confidence": 0.851, + "words": [ + { + "text": "got", + "start": 85.24, + "end": 85.28, + "confidence": 0.0 + }, + { + "text": "them,", + "start": 85.28, + "end": 85.32, + "confidence": 0.024 + }, + { + "text": "got", + "start": 85.32, + "end": 85.36, + "confidence": 0.839 + }, + { + "text": "them,", + "start": 85.36, + "end": 85.4, + "confidence": 0.564 + }, + { + "text": "got", + "start": 85.4, + "end": 85.44, + "confidence": 0.755 + }, + { + "text": "them,", + "start": 85.44, + "end": 85.48, + "confidence": 0.442 + }, + { + "text": "got", + "start": 85.48, + "end": 85.52, + "confidence": 0.859 + }, + { + "text": "them,", + "start": 85.52, + "end": 85.56, + "confidence": 0.389 + }, + { + "text": "got", + "start": 85.56, + "end": 85.6, + "confidence": 0.895 + }, + { + "text": "them,", + "start": 85.6, + "end": 85.64, + "confidence": 0.376 + }, + { + "text": "got", + "start": 85.64, + "end": 85.68, + "confidence": 0.896 + }, + { + "text": "them,", + "start": 85.68, + "end": 85.72, + "confidence": 0.39 + }, + { + "text": "got", + "start": 85.72, + "end": 85.76, + "confidence": 0.871 + }, + { + "text": "them,", + "start": 85.76, + "end": 85.8, + "confidence": 0.468 + }, + { + "text": "got", + "start": 85.8, + "end": 85.84, + "confidence": 0.894 + }, + { + "text": "them,", + "start": 85.84, + "end": 85.88, + "confidence": 0.576 + }, + { + "text": "got", + "start": 85.88, + "end": 85.92, + "confidence": 0.914 + }, + { + "text": "them,", + "start": 85.92, + "end": 85.96, + "confidence": 0.645 + }, + { + "text": "got", + "start": 85.96, + "end": 86.0, + "confidence": 0.633 + }, + { + "text": "them,", + "start": 86.0, + "end": 86.04, + "confidence": 0.746 + }, + { + "text": "got", + "start": 86.04, + "end": 86.08, + "confidence": 0.829 + }, + { + "text": "them,", + "start": 86.08, + "end": 86.12, + "confidence": 0.842 + }, + { + "text": "got", + "start": 86.12, + "end": 86.16, + "confidence": 0.906 + 
}, + { + "text": "them,", + "start": 86.16, + "end": 86.2, + "confidence": 0.89 + }, + { + "text": "got", + "start": 86.2, + "end": 86.24, + "confidence": 0.924 + }, + { + "text": "them,", + "start": 86.24, + "end": 86.28, + "confidence": 0.916 + }, + { + "text": "got", + "start": 86.28, + "end": 86.32, + "confidence": 0.94 + }, + { + "text": "them,", + "start": 86.32, + "end": 86.36, + "confidence": 0.934 + }, + { + "text": "got", + "start": 86.36, + "end": 86.4, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 86.4, + "end": 86.44, + "confidence": 0.946 + }, + { + "text": "got", + "start": 86.44, + "end": 86.48, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 86.48, + "end": 86.52, + "confidence": 0.946 + }, + { + "text": "got", + "start": 86.52, + "end": 86.56, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 86.56, + "end": 86.6, + "confidence": 0.946 + }, + { + "text": "got", + "start": 86.6, + "end": 86.64, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 86.64, + "end": 86.68, + "confidence": 0.948 + }, + { + "text": "got", + "start": 86.68, + "end": 86.72, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 86.72, + "end": 86.76, + "confidence": 0.953 + }, + { + "text": "got", + "start": 86.76, + "end": 86.8, + "confidence": 0.942 + }, + { + "text": "them,", + "start": 86.8, + "end": 86.84, + "confidence": 0.956 + }, + { + "text": "got", + "start": 86.84, + "end": 86.88, + "confidence": 0.942 + }, + { + "text": "them,", + "start": 86.88, + "end": 86.92, + "confidence": 0.961 + }, + { + "text": "got", + "start": 86.92, + "end": 86.96, + "confidence": 0.942 + }, + { + "text": "them,", + "start": 86.96, + "end": 87.0, + "confidence": 0.964 + }, + { + "text": "got", + "start": 87.0, + "end": 87.04, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 87.04, + "end": 87.08, + "confidence": 0.967 + }, + { + "text": "got", + "start": 87.08, + "end": 87.12, + "confidence": 0.948 + }, + { + "text": 
"them,", + "start": 87.12, + "end": 87.16, + "confidence": 0.969 + }, + { + "text": "got", + "start": 87.16, + "end": 87.2, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 87.2, + "end": 87.24, + "confidence": 0.972 + }, + { + "text": "got", + "start": 87.24, + "end": 87.28, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 87.28, + "end": 87.32, + "confidence": 0.976 + }, + { + "text": "got", + "start": 87.32, + "end": 87.36, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 87.36, + "end": 87.4, + "confidence": 0.976 + }, + { + "text": "got", + "start": 87.4, + "end": 87.44, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 87.44, + "end": 87.48, + "confidence": 0.977 + }, + { + "text": "got", + "start": 87.48, + "end": 87.52, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 87.52, + "end": 87.56, + "confidence": 0.978 + }, + { + "text": "got", + "start": 87.56, + "end": 87.6, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 87.6, + "end": 87.64, + "confidence": 0.98 + }, + { + "text": "got", + "start": 87.64, + "end": 87.68, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 87.68, + "end": 87.72, + "confidence": 0.98 + }, + { + "text": "got", + "start": 87.72, + "end": 87.76, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 87.76, + "end": 87.8, + "confidence": 0.981 + }, + { + "text": "got", + "start": 87.8, + "end": 87.84, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 87.84, + "end": 87.88, + "confidence": 0.982 + }, + { + "text": "got", + "start": 87.88, + "end": 87.92, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 87.92, + "end": 87.96, + "confidence": 0.983 + }, + { + "text": "got", + "start": 87.96, + "end": 88.0, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 88.0, + "end": 88.04, + "confidence": 0.983 + }, + { + "text": "got", + "start": 88.04, + "end": 88.08, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 
88.08, + "end": 88.12, + "confidence": 0.983 + }, + { + "text": "got", + "start": 88.12, + "end": 88.16, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 88.16, + "end": 88.2, + "confidence": 0.984 + }, + { + "text": "got", + "start": 88.2, + "end": 88.24, + "confidence": 0.966 + }, + { + "text": "them,", + "start": 88.24, + "end": 88.28, + "confidence": 0.984 + }, + { + "text": "got", + "start": 88.28, + "end": 88.32, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 88.32, + "end": 88.36, + "confidence": 0.986 + }, + { + "text": "got", + "start": 88.36, + "end": 88.4, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 88.4, + "end": 88.44, + "confidence": 0.986 + }, + { + "text": "got", + "start": 88.44, + "end": 88.48, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 88.48, + "end": 88.52, + "confidence": 0.986 + }, + { + "text": "got", + "start": 88.52, + "end": 88.56, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 88.56, + "end": 88.6, + "confidence": 0.987 + }, + { + "text": "got", + "start": 88.6, + "end": 88.64, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 88.64, + "end": 88.68, + "confidence": 0.987 + }, + { + "text": "got", + "start": 88.68, + "end": 88.72, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 88.72, + "end": 88.76, + "confidence": 0.988 + }, + { + "text": "got", + "start": 88.76, + "end": 88.8, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 88.8, + "end": 88.84, + "confidence": 0.988 + }, + { + "text": "got", + "start": 88.84, + "end": 88.88, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 88.88, + "end": 88.92, + "confidence": 0.989 + }, + { + "text": "got", + "start": 88.92, + "end": 88.96, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 88.96, + "end": 89.0, + "confidence": 0.989 + }, + { + "text": "got", + "start": 89.0, + "end": 89.04, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 89.04, + "end": 
89.08, + "confidence": 0.989 + }, + { + "text": "got", + "start": 89.08, + "end": 89.12, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 89.12, + "end": 89.16, + "confidence": 0.989 + }, + { + "text": "got", + "start": 89.16, + "end": 89.2, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 89.2, + "end": 89.24, + "confidence": 0.99 + }, + { + "text": "got", + "start": 89.24, + "end": 89.28, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 89.28, + "end": 89.32, + "confidence": 0.991 + }, + { + "text": "got", + "start": 89.32, + "end": 89.36, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 89.36, + "end": 89.4, + "confidence": 0.991 + }, + { + "text": "got", + "start": 89.4, + "end": 89.44, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 89.44, + "end": 89.48, + "confidence": 0.991 + }, + { + "text": "got", + "start": 89.48, + "end": 89.52, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 89.52, + "end": 89.56, + "confidence": 0.991 + }, + { + "text": "got", + "start": 89.56, + "end": 89.6, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 89.6, + "end": 89.64, + "confidence": 0.992 + }, + { + "text": "got", + "start": 89.64, + "end": 89.68, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 89.68, + "end": 89.72, + "confidence": 0.992 + }, + { + "text": "got", + "start": 89.72, + "end": 89.76, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 89.76, + "end": 89.8, + "confidence": 0.992 + }, + { + "text": "got", + "start": 89.8, + "end": 89.84, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 89.84, + "end": 89.88, + "confidence": 0.992 + }, + { + "text": "got", + "start": 89.88, + "end": 89.92, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 89.92, + "end": 89.96, + "confidence": 0.993 + }, + { + "text": "got", + "start": 89.96, + "end": 90.0, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 90.0, + "end": 90.04, + 
"confidence": 0.993 + }, + { + "text": "got", + "start": 90.04, + "end": 90.08, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 90.08, + "end": 90.12, + "confidence": 0.993 + }, + { + "text": "got", + "start": 90.12, + "end": 90.16, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 90.16, + "end": 90.2, + "confidence": 0.993 + }, + { + "text": "got", + "start": 90.2, + "end": 90.24, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 90.24, + "end": 90.28, + "confidence": 0.994 + }, + { + "text": "got", + "start": 90.28, + "end": 90.32, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 90.32, + "end": 90.36, + "confidence": 0.993 + }, + { + "text": "got", + "start": 90.36, + "end": 90.4, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 90.4, + "end": 90.44, + "confidence": 0.993 + }, + { + "text": "got", + "start": 90.44, + "end": 90.48, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 90.48, + "end": 90.52, + "confidence": 0.994 + }, + { + "text": "got", + "start": 90.52, + "end": 90.56, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 90.56, + "end": 90.6, + "confidence": 0.994 + }, + { + "text": "got", + "start": 90.6, + "end": 90.64, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 90.64, + "end": 90.68, + "confidence": 0.994 + }, + { + "text": "got", + "start": 90.68, + "end": 90.72, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 90.72, + "end": 90.76, + "confidence": 0.994 + }, + { + "text": "got", + "start": 90.76, + "end": 90.8, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 90.8, + "end": 90.84, + "confidence": 0.994 + }, + { + "text": "got", + "start": 90.84, + "end": 90.88, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 90.88, + "end": 90.92, + "confidence": 0.994 + }, + { + "text": "got", + "start": 90.92, + "end": 90.96, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 90.96, + "end": 91.0, + "confidence": 
0.994 + }, + { + "text": "got", + "start": 91.0, + "end": 91.04, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 91.04, + "end": 91.08, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.08, + "end": 91.12, + "confidence": 0.995 + }, + { + "text": "them", + "start": 91.12, + "end": 91.16, + "confidence": 0.998 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/naive.cuda/accurate_apollo11.mp3.words.json b/tests/expected/naive.cuda/accurate_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..5541228558b3a625658b695ccc9b63cdd745f928 --- /dev/null +++ b/tests/expected/naive.cuda/accurate_apollo11.mp3.words.json @@ -0,0 +1,2438 @@ +{ + "text": " Apollo 11, Houston, we got a recommendation for you on your Soyuz-EA GLEM-E-G-E-A. All right. Okay. Yeah, sir. Yeah, sir. Let's take that camera. Let's say it makes it want to go on the helmet we were going to have in B-1. The other one. And you can put the other one on the mic helmet. We'll show it to you in a quick screen. Over. All right. Yeah, sir. All right. Yeah, sir. There's a better helmet than B-1. That's the other one. Nice. Let's go in there. At least we're safe. We've got them in there. Helmet bags. And, uh, I guess we have helmets in the helmet bag. At least it's in the helmet bag. Right here. Right here. Yeah, we're taking it next day out of the field up. Yeah, we were. You want to hack me on that? Yeah, we were. You want to hack me on that? With the cover, I tried it already. Okay, fine. We weren't sure of that. Just a suggestion. We thought we'd, uh, say you could check it out. It's not much of an order to turn that. So, uh, I guess we're going to come up with this. Let us know. Okay. No problem. Okay. No problem. No problem. No problem. No problem. No problem. No problem. 
No problem.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.64, + "end": 6.76, + "text": " Apollo 11, Houston, we got a recommendation for you on your Soyuz-EA GLEM-E-G-E-A.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 11, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 36, + 32, + 460, + 2634, + 44, + 12, + 36, + 12, + 38, + 12, + 36, + 12, + 32, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.578, + "words": [ + { + "text": "Apollo", + "start": 0.64, + "end": 0.98, + "confidence": 0.425 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.52, + "confidence": 0.842 + }, + { + "text": "Houston,", + "start": 1.52, + "end": 1.94, + "confidence": 0.665 + }, + { + "text": "we", + "start": 1.94, + "end": 1.98, + "confidence": 0.983 + }, + { + "text": "got", + "start": 1.98, + "end": 2.16, + "confidence": 0.743 + }, + { + "text": "a", + "start": 2.16, + "end": 2.32, + "confidence": 0.993 + }, + { + "text": "recommendation", + "start": 2.32, + "end": 3.08, + "confidence": 0.977 + }, + { + "text": "for", + "start": 3.08, + "end": 3.5, + "confidence": 0.94 + }, + { + "text": "you", + "start": 3.5, + "end": 3.72, + "confidence": 0.993 + }, + { + "text": "on", + "start": 3.72, + "end": 4.26, + "confidence": 0.918 + }, + { + "text": "your", + "start": 4.26, + "end": 4.3, + "confidence": 0.976 + }, + { + "text": "Soyuz-EA", + "start": 4.3, + "end": 5.36, + "confidence": 0.455 + }, + { + "text": "GLEM-E-G-E-A.", + "start": 5.36, + "end": 6.76, + "confidence": 0.436 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.82, + "end": 10.9, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.149, + "words": [ + { + "text": "All", + "start": 
10.82, + "end": 10.86, + "confidence": 0.006 + }, + { + "text": "right.", + "start": 10.86, + "end": 10.9, + "confidence": 0.72 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 12.02, + "end": 12.06, + "text": " Okay.", + "tokens": [ + 1033, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.168, + "words": [ + { + "text": "Okay.", + "start": 12.02, + "end": 12.06, + "confidence": 0.168 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 12.08, + "end": 13.44, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.131, + "words": [ + { + "text": "Yeah,", + "start": 12.08, + "end": 12.68, + "confidence": 0.079 + }, + { + "text": "sir.", + "start": 12.68, + "end": 13.44, + "confidence": 0.218 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.66, + "end": 14.28, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.047, + "words": [ + { + "text": "Yeah,", + "start": 13.66, + "end": 13.82, + "confidence": 0.11 + }, + { + "text": "sir.", + "start": 13.82, + "end": 14.28, + "confidence": 0.02 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 14.3, + "end": 14.98, + "text": " Let's take that camera.", + "tokens": [ + 961, + 311, + 747, + 300, + 2799, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.033, + "words": [ + { + "text": "Let's", + "start": 14.3, + "end": 14.54, + "confidence": 0.036 + }, + { + "text": "take", + "start": 14.54, + "end": 14.58, + "confidence": 0.026 + }, 
+ { + "text": "that", + "start": 14.58, + "end": 14.62, + "confidence": 0.031 + }, + { + "text": "camera.", + "start": 14.62, + "end": 14.98, + "confidence": 0.034 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 15.0, + "end": 19.22, + "text": " Let's say it makes it want to go on the helmet we were going to have in B-1.", + "tokens": [ + 961, + 311, + 584, + 309, + 1669, + 309, + 528, + 281, + 352, + 322, + 264, + 15922, + 321, + 645, + 516, + 281, + 362, + 294, + 363, + 12, + 16, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.299, + "words": [ + { + "text": "Let's", + "start": 15.0, + "end": 15.38, + "confidence": 0.273 + }, + { + "text": "say", + "start": 15.38, + "end": 15.58, + "confidence": 0.349 + }, + { + "text": "it", + "start": 15.58, + "end": 15.76, + "confidence": 0.01 + }, + { + "text": "makes", + "start": 15.76, + "end": 15.8, + "confidence": 0.736 + }, + { + "text": "it", + "start": 15.8, + "end": 16.04, + "confidence": 0.921 + }, + { + "text": "want", + "start": 16.04, + "end": 16.16, + "confidence": 0.297 + }, + { + "text": "to", + "start": 16.16, + "end": 16.34, + "confidence": 0.97 + }, + { + "text": "go", + "start": 16.34, + "end": 16.44, + "confidence": 0.932 + }, + { + "text": "on", + "start": 16.44, + "end": 16.74, + "confidence": 0.912 + }, + { + "text": "the", + "start": 16.74, + "end": 16.86, + "confidence": 0.496 + }, + { + "text": "helmet", + "start": 16.86, + "end": 17.34, + "confidence": 0.005 + }, + { + "text": "we", + "start": 17.34, + "end": 17.64, + "confidence": 0.01 + }, + { + "text": "were", + "start": 17.64, + "end": 17.86, + "confidence": 0.08 + }, + { + "text": "going", + "start": 17.86, + "end": 18.04, + "confidence": 0.658 + }, + { + "text": "to", + "start": 18.04, + "end": 18.2, + "confidence": 0.966 + }, + { + "text": "have", + "start": 18.2, + "end": 18.26, + "confidence": 0.957 + }, + { + 
"text": "in", + "start": 18.26, + "end": 18.64, + "confidence": 0.863 + }, + { + "text": "B-1.", + "start": 18.64, + "end": 19.22, + "confidence": 0.506 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 19.38, + "end": 19.98, + "text": " The other one.", + "tokens": [ + 440, + 661, + 472, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.13, + "words": [ + { + "text": "The", + "start": 19.38, + "end": 19.42, + "confidence": 0.005 + }, + { + "text": "other", + "start": 19.42, + "end": 19.68, + "confidence": 0.186 + }, + { + "text": "one.", + "start": 19.68, + "end": 19.98, + "confidence": 0.586 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 20.12, + "end": 22.9, + "text": " And you can put the other one on the mic helmet.", + "tokens": [ + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.366, + "words": [ + { + "text": "And", + "start": 20.12, + "end": 20.26, + "confidence": 0.343 + }, + { + "text": "you", + "start": 20.26, + "end": 20.38, + "confidence": 0.89 + }, + { + "text": "can", + "start": 20.38, + "end": 20.54, + "confidence": 0.087 + }, + { + "text": "put", + "start": 20.54, + "end": 20.7, + "confidence": 0.901 + }, + { + "text": "the", + "start": 20.7, + "end": 20.86, + "confidence": 0.979 + }, + { + "text": "other", + "start": 20.86, + "end": 21.06, + "confidence": 0.997 + }, + { + "text": "one", + "start": 21.06, + "end": 21.26, + "confidence": 0.973 + }, + { + "text": "on", + "start": 21.26, + "end": 21.9, + "confidence": 0.968 + }, + { + "text": "the", + "start": 21.9, + "end": 21.94, + "confidence": 0.09 + }, + { + "text": "mic", + "start": 21.94, + "end": 22.58, + "confidence": 0.682 + }, + { + "text": "helmet.", + "start": 
22.58, + "end": 22.9, + "confidence": 0.066 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 22.92, + "end": 24.8, + "text": " We'll show it to you in a quick screen.", + "tokens": [ + 492, + 603, + 855, + 309, + 281, + 291, + 294, + 257, + 1702, + 2568, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.122, + "words": [ + { + "text": "We'll", + "start": 22.92, + "end": 23.22, + "confidence": 0.08 + }, + { + "text": "show", + "start": 23.22, + "end": 23.32, + "confidence": 0.011 + }, + { + "text": "it", + "start": 23.32, + "end": 23.54, + "confidence": 0.15 + }, + { + "text": "to", + "start": 23.54, + "end": 23.64, + "confidence": 0.255 + }, + { + "text": "you", + "start": 23.64, + "end": 23.78, + "confidence": 0.703 + }, + { + "text": "in", + "start": 23.78, + "end": 23.96, + "confidence": 0.231 + }, + { + "text": "a", + "start": 23.96, + "end": 24.12, + "confidence": 0.736 + }, + { + "text": "quick", + "start": 24.12, + "end": 24.16, + "confidence": 0.018 + }, + { + "text": "screen.", + "start": 24.16, + "end": 24.8, + "confidence": 0.122 + } + ] + }, + { + "id": 10, + "seek": 0, + "start": 24.94, + "end": 25.26, + "text": " Over.", + "tokens": [ + 4886, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5338267664755544, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.4499393105506897, + "confidence": 0.125, + "words": [ + { + "text": "Over.", + "start": 24.94, + "end": 25.26, + "confidence": 0.125 + } + ] + }, + { + "id": 11, + "seek": 2600, + "start": 25.52, + "end": 27.52, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.108, + "words": [ + { + "text": "All", + "start": 25.52, + "end": 26.14, + "confidence": 0.003 + }, + { + "text": "right.", + 
"start": 26.14, + "end": 27.52, + "confidence": 0.677 + } + ] + }, + { + "id": 12, + "seek": 2600, + "start": 31.32, + "end": 32.48, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.045, + "words": [ + { + "text": "Yeah,", + "start": 31.32, + "end": 31.56, + "confidence": 0.033 + }, + { + "text": "sir.", + "start": 31.56, + "end": 32.48, + "confidence": 0.062 + } + ] + }, + { + "id": 13, + "seek": 2600, + "start": 32.66, + "end": 33.06, + "text": " All right.", + "tokens": [ + 1057, + 558, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.223, + "words": [ + { + "text": "All", + "start": 32.66, + "end": 32.94, + "confidence": 0.047 + }, + { + "text": "right.", + "start": 32.94, + "end": 33.06, + "confidence": 0.488 + } + ] + }, + { + "id": 14, + "seek": 2600, + "start": 33.08, + "end": 34.2, + "text": " Yeah, sir.", + "tokens": [ + 865, + 11, + 4735, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.035, + "words": [ + { + "text": "Yeah,", + "start": 33.08, + "end": 33.36, + "confidence": 0.144 + }, + { + "text": "sir.", + "start": 33.36, + "end": 34.2, + "confidence": 0.009 + } + ] + }, + { + "id": 15, + "seek": 2600, + "start": 34.52, + "end": 35.4, + "text": " There's a better helmet than B-1.", + "tokens": [ + 821, + 311, + 257, + 1101, + 15922, + 813, + 363, + 12, + 16, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.014, + "words": [ + { + "text": "There's", + "start": 34.52, + "end": 34.56, + "confidence": 0.046 + 
}, + { + "text": "a", + "start": 34.56, + "end": 34.64, + "confidence": 0.037 + }, + { + "text": "better", + "start": 34.64, + "end": 34.94, + "confidence": 0.0 + }, + { + "text": "helmet", + "start": 34.94, + "end": 34.98, + "confidence": 0.0 + }, + { + "text": "than", + "start": 34.98, + "end": 35.02, + "confidence": 0.179 + }, + { + "text": "B-1.", + "start": 35.02, + "end": 35.4, + "confidence": 0.033 + } + ] + }, + { + "id": 16, + "seek": 2600, + "start": 35.42, + "end": 35.94, + "text": " That's the other one.", + "tokens": [ + 663, + 311, + 264, + 661, + 472, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.162, + "words": [ + { + "text": "That's", + "start": 35.42, + "end": 35.48, + "confidence": 0.082 + }, + { + "text": "the", + "start": 35.48, + "end": 35.52, + "confidence": 0.167 + }, + { + "text": "other", + "start": 35.52, + "end": 35.68, + "confidence": 0.412 + }, + { + "text": "one.", + "start": 35.68, + "end": 35.94, + "confidence": 0.197 + } + ] + }, + { + "id": 17, + "seek": 2600, + "start": 35.96, + "end": 36.34, + "text": " Nice.", + "tokens": [ + 5490, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.007, + "words": [ + { + "text": "Nice.", + "start": 35.96, + "end": 36.34, + "confidence": 0.007 + } + ] + }, + { + "id": 18, + "seek": 2600, + "start": 37.68, + "end": 38.48, + "text": " Let's go in there.", + "tokens": [ + 961, + 311, + 352, + 294, + 456, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.125, + "words": [ + { + "text": "Let's", + "start": 37.68, + "end": 38.16, + "confidence": 0.022 + }, + { + "text": "go", + "start": 38.16, + "end": 38.2, + "confidence": 0.626 + }, 
+ { + "text": "in", + "start": 38.2, + "end": 38.24, + "confidence": 0.037 + }, + { + "text": "there.", + "start": 38.24, + "end": 38.48, + "confidence": 0.579 + } + ] + }, + { + "id": 19, + "seek": 2600, + "start": 38.6, + "end": 39.24, + "text": " At least we're safe.", + "tokens": [ + 1711, + 1935, + 321, + 434, + 3273, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.125, + "words": [ + { + "text": "At", + "start": 38.6, + "end": 38.64, + "confidence": 0.001 + }, + { + "text": "least", + "start": 38.64, + "end": 38.86, + "confidence": 0.311 + }, + { + "text": "we're", + "start": 38.86, + "end": 39.08, + "confidence": 0.12 + }, + { + "text": "safe.", + "start": 39.08, + "end": 39.24, + "confidence": 0.799 + } + ] + }, + { + "id": 20, + "seek": 2600, + "start": 39.94, + "end": 40.54, + "text": " We've got them in there.", + "tokens": [ + 492, + 600, + 658, + 552, + 294, + 456, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.076, + "words": [ + { + "text": "We've", + "start": 39.94, + "end": 40.38, + "confidence": 0.06 + }, + { + "text": "got", + "start": 40.38, + "end": 40.42, + "confidence": 0.737 + }, + { + "text": "them", + "start": 40.42, + "end": 40.46, + "confidence": 0.004 + }, + { + "text": "in", + "start": 40.46, + "end": 40.5, + "confidence": 0.039 + }, + { + "text": "there.", + "start": 40.5, + "end": 40.54, + "confidence": 0.198 + } + ] + }, + { + "id": 21, + "seek": 2600, + "start": 40.54, + "end": 41.28, + "text": " Helmet bags.", + "tokens": [ + 6128, + 5537, + 10405, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.001, + "words": [ + { + "text": "Helmet", + "start": 40.54, + 
"end": 40.78, + "confidence": 0.001 + }, + { + "text": "bags.", + "start": 40.78, + "end": 41.28, + "confidence": 0.002 + } + ] + }, + { + "id": 22, + "seek": 2600, + "start": 43.52, + "end": 47.74, + "text": " And, uh, I guess we have helmets in the helmet bag.", + "tokens": [ + 400, + 11, + 2232, + 11, + 286, + 2041, + 321, + 362, + 42022, + 294, + 264, + 15922, + 3411, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.208, + "words": [ + { + "text": "And,", + "start": 43.52, + "end": 43.56, + "confidence": 0.087 + }, + { + "text": "uh,", + "start": 43.56, + "end": 44.02, + "confidence": 0.767 + }, + { + "text": "I", + "start": 44.02, + "end": 44.06, + "confidence": 0.321 + }, + { + "text": "guess", + "start": 44.06, + "end": 44.32, + "confidence": 0.236 + }, + { + "text": "we", + "start": 44.32, + "end": 45.0, + "confidence": 0.078 + }, + { + "text": "have", + "start": 45.0, + "end": 45.6, + "confidence": 0.06 + }, + { + "text": "helmets", + "start": 45.6, + "end": 46.62, + "confidence": 0.004 + }, + { + "text": "in", + "start": 46.62, + "end": 46.82, + "confidence": 0.6 + }, + { + "text": "the", + "start": 46.82, + "end": 46.98, + "confidence": 0.614 + }, + { + "text": "helmet", + "start": 46.98, + "end": 47.2, + "confidence": 0.823 + }, + { + "text": "bag.", + "start": 47.2, + "end": 47.74, + "confidence": 0.363 + } + ] + }, + { + "id": 23, + "seek": 2600, + "start": 48.24, + "end": 49.84, + "text": " At least it's in the helmet bag.", + "tokens": [ + 1711, + 1935, + 309, + 311, + 294, + 264, + 15922, + 3411, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.112, + "words": [ + { + "text": "At", + "start": 48.24, + "end": 48.38, + "confidence": 0.064 + }, + { + "text": "least", + "start": 48.38, + "end": 48.66, + 
"confidence": 0.795 + }, + { + "text": "it's", + "start": 48.66, + "end": 49.02, + "confidence": 0.347 + }, + { + "text": "in", + "start": 49.02, + "end": 49.06, + "confidence": 0.172 + }, + { + "text": "the", + "start": 49.06, + "end": 49.1, + "confidence": 0.242 + }, + { + "text": "helmet", + "start": 49.1, + "end": 49.22, + "confidence": 0.003 + }, + { + "text": "bag.", + "start": 49.22, + "end": 49.84, + "confidence": 0.062 + } + ] + }, + { + "id": 24, + "seek": 2600, + "start": 50.22, + "end": 50.94, + "text": " Right here.", + "tokens": [ + 1779, + 510, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.099, + "words": [ + { + "text": "Right", + "start": 50.22, + "end": 50.48, + "confidence": 0.006 + }, + { + "text": "here.", + "start": 50.48, + "end": 50.94, + "confidence": 0.416 + } + ] + }, + { + "id": 25, + "seek": 2600, + "start": 51.54, + "end": 52.24, + "text": " Right here.", + "tokens": [ + 1779, + 510, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.04, + "words": [ + { + "text": "Right", + "start": 51.54, + "end": 51.8, + "confidence": 0.008 + }, + { + "text": "here.", + "start": 51.8, + "end": 52.24, + "confidence": 0.091 + } + ] + }, + { + "id": 26, + "seek": 2600, + "start": 53.2, + "end": 55.42, + "text": " Yeah, we're taking it next day out of the field up.", + "tokens": [ + 865, + 11, + 321, + 434, + 1940, + 309, + 958, + 786, + 484, + 295, + 264, + 2519, + 493, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5128642573501124, + "compression_ratio": 1.728643216080402, + "no_speech_prob": 0.0011020583333447576, + "confidence": 0.367, + "words": [ + { + "text": "Yeah,", + "start": 53.2, + "end": 53.38, + "confidence": 0.47 + }, + { + "text": "we're", + "start": 53.38, + "end": 53.7, + "confidence": 
0.742 + }, + { + "text": "taking", + "start": 53.7, + "end": 53.74, + "confidence": 0.322 + }, + { + "text": "it", + "start": 53.74, + "end": 53.86, + "confidence": 0.082 + }, + { + "text": "next", + "start": 53.86, + "end": 53.96, + "confidence": 0.545 + }, + { + "text": "day", + "start": 53.96, + "end": 54.16, + "confidence": 0.817 + }, + { + "text": "out", + "start": 54.16, + "end": 54.32, + "confidence": 0.29 + }, + { + "text": "of", + "start": 54.32, + "end": 54.54, + "confidence": 0.351 + }, + { + "text": "the", + "start": 54.54, + "end": 54.68, + "confidence": 0.432 + }, + { + "text": "field", + "start": 54.68, + "end": 55.2, + "confidence": 0.233 + }, + { + "text": "up.", + "start": 55.2, + "end": 55.42, + "confidence": 0.235 + } + ] + }, + { + "id": 27, + "seek": 5500, + "start": 55.44, + "end": 56.12, + "text": " Yeah, we were.", + "tokens": [ + 865, + 11, + 321, + 645, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.02, + "words": [ + { + "text": "Yeah,", + "start": 55.44, + "end": 55.48, + "confidence": 0.024 + }, + { + "text": "we", + "start": 55.48, + "end": 55.52, + "confidence": 0.022 + }, + { + "text": "were.", + "start": 55.52, + "end": 56.12, + "confidence": 0.017 + } + ] + }, + { + "id": 28, + "seek": 5500, + "start": 56.5, + "end": 57.48, + "text": " You want to hack me on that?", + "tokens": [ + 509, + 528, + 281, + 10339, + 385, + 322, + 300, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.019, + "words": [ + { + "text": "You", + "start": 56.5, + "end": 56.62, + "confidence": 0.007 + }, + { + "text": "want", + "start": 56.62, + "end": 57.0, + "confidence": 0.01 + }, + { + "text": "to", + "start": 57.0, + "end": 57.22, + "confidence": 0.257 + }, + { + "text": "hack", + "start": 57.22, + 
"end": 57.36, + "confidence": 0.0 + }, + { + "text": "me", + "start": 57.36, + "end": 57.4, + "confidence": 0.054 + }, + { + "text": "on", + "start": 57.4, + "end": 57.44, + "confidence": 0.005 + }, + { + "text": "that?", + "start": 57.44, + "end": 57.48, + "confidence": 0.22 + } + ] + }, + { + "id": 29, + "seek": 5500, + "start": 57.48, + "end": 58.26, + "text": " Yeah, we were.", + "tokens": [ + 865, + 11, + 321, + 645, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.047, + "words": [ + { + "text": "Yeah,", + "start": 57.48, + "end": 57.96, + "confidence": 0.029 + }, + { + "text": "we", + "start": 57.96, + "end": 58.06, + "confidence": 0.096 + }, + { + "text": "were.", + "start": 58.06, + "end": 58.26, + "confidence": 0.053 + } + ] + }, + { + "id": 30, + "seek": 5500, + "start": 58.28, + "end": 59.48, + "text": " You want to hack me on that?", + "tokens": [ + 509, + 528, + 281, + 10339, + 385, + 322, + 300, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.055, + "words": [ + { + "text": "You", + "start": 58.28, + "end": 58.46, + "confidence": 0.029 + }, + { + "text": "want", + "start": 58.46, + "end": 58.6, + "confidence": 0.107 + }, + { + "text": "to", + "start": 58.6, + "end": 58.64, + "confidence": 0.376 + }, + { + "text": "hack", + "start": 58.64, + "end": 58.76, + "confidence": 0.0 + }, + { + "text": "me", + "start": 58.76, + "end": 58.96, + "confidence": 0.442 + }, + { + "text": "on", + "start": 58.96, + "end": 59.18, + "confidence": 0.266 + }, + { + "text": "that?", + "start": 59.18, + "end": 59.48, + "confidence": 0.186 + } + ] + }, + { + "id": 31, + "seek": 5500, + "start": 59.5, + "end": 61.96, + "text": " With the cover, I tried it already.", + "tokens": [ + 2022, + 264, + 2060, + 11, + 286, + 3031, + 
309, + 1217, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.202, + "words": [ + { + "text": "With", + "start": 59.5, + "end": 60.1, + "confidence": 0.012 + }, + { + "text": "the", + "start": 60.1, + "end": 60.82, + "confidence": 0.238 + }, + { + "text": "cover,", + "start": 60.82, + "end": 61.3, + "confidence": 0.165 + }, + { + "text": "I", + "start": 61.3, + "end": 61.34, + "confidence": 0.826 + }, + { + "text": "tried", + "start": 61.34, + "end": 61.52, + "confidence": 0.019 + }, + { + "text": "it", + "start": 61.52, + "end": 61.72, + "confidence": 0.699 + }, + { + "text": "already.", + "start": 61.72, + "end": 61.96, + "confidence": 0.832 + } + ] + }, + { + "id": 32, + "seek": 5500, + "start": 62.56, + "end": 63.16, + "text": " Okay, fine.", + "tokens": [ + 1033, + 11, + 2489, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.542, + "words": [ + { + "text": "Okay,", + "start": 62.56, + "end": 62.98, + "confidence": 0.49 + }, + { + "text": "fine.", + "start": 62.98, + "end": 63.16, + "confidence": 0.601 + } + ] + }, + { + "id": 33, + "seek": 5500, + "start": 63.2, + "end": 64.16, + "text": " We weren't sure of that.", + "tokens": [ + 492, + 4999, + 380, + 988, + 295, + 300, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.75, + "words": [ + { + "text": "We", + "start": 63.2, + "end": 63.36, + "confidence": 0.468 + }, + { + "text": "weren't", + "start": 63.36, + "end": 63.6, + "confidence": 0.939 + }, + { + "text": "sure", + "start": 63.6, + "end": 63.8, + "confidence": 0.916 + }, + { + "text": "of", + "start": 63.8, + "end": 63.88, + "confidence": 0.594 + }, + { + "text": "that.", + 
"start": 63.88, + "end": 64.16, + "confidence": 0.771 + } + ] + }, + { + "id": 34, + "seek": 5500, + "start": 64.48, + "end": 65.14, + "text": " Just a suggestion.", + "tokens": [ + 1449, + 257, + 16541, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.163, + "words": [ + { + "text": "Just", + "start": 64.48, + "end": 64.64, + "confidence": 0.011 + }, + { + "text": "a", + "start": 64.64, + "end": 64.78, + "confidence": 0.428 + }, + { + "text": "suggestion.", + "start": 64.78, + "end": 65.14, + "confidence": 0.386 + } + ] + }, + { + "id": 35, + "seek": 5500, + "start": 65.16, + "end": 68.04, + "text": " We thought we'd, uh, say you could check it out.", + "tokens": [ + 492, + 1194, + 321, + 1116, + 11, + 2232, + 11, + 584, + 291, + 727, + 1520, + 309, + 484, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.546, + "words": [ + { + "text": "We", + "start": 65.16, + "end": 65.42, + "confidence": 0.164 + }, + { + "text": "thought", + "start": 65.42, + "end": 65.62, + "confidence": 0.835 + }, + { + "text": "we'd,", + "start": 65.62, + "end": 66.14, + "confidence": 0.391 + }, + { + "text": "uh,", + "start": 66.14, + "end": 66.96, + "confidence": 0.678 + }, + { + "text": "say", + "start": 66.96, + "end": 67.0, + "confidence": 0.181 + }, + { + "text": "you", + "start": 67.0, + "end": 67.14, + "confidence": 0.825 + }, + { + "text": "could", + "start": 67.14, + "end": 67.3, + "confidence": 0.715 + }, + { + "text": "check", + "start": 67.3, + "end": 67.44, + "confidence": 0.637 + }, + { + "text": "it", + "start": 67.44, + "end": 67.66, + "confidence": 0.982 + }, + { + "text": "out.", + "start": 67.66, + "end": 68.04, + "confidence": 0.908 + } + ] + }, + { + "id": 36, + "seek": 5500, + "start": 68.24, + "end": 69.46, + "text": " 
It's not much of an order to turn that.", + "tokens": [ + 467, + 311, + 406, + 709, + 295, + 364, + 1668, + 281, + 1261, + 300, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.139, + "words": [ + { + "text": "It's", + "start": 68.24, + "end": 68.46, + "confidence": 0.077 + }, + { + "text": "not", + "start": 68.46, + "end": 68.5, + "confidence": 0.09 + }, + { + "text": "much", + "start": 68.5, + "end": 68.64, + "confidence": 0.342 + }, + { + "text": "of", + "start": 68.64, + "end": 68.78, + "confidence": 0.388 + }, + { + "text": "an", + "start": 68.78, + "end": 68.9, + "confidence": 0.399 + }, + { + "text": "order", + "start": 68.9, + "end": 68.94, + "confidence": 0.018 + }, + { + "text": "to", + "start": 68.94, + "end": 69.14, + "confidence": 0.122 + }, + { + "text": "turn", + "start": 69.14, + "end": 69.18, + "confidence": 0.447 + }, + { + "text": "that.", + "start": 69.18, + "end": 69.46, + "confidence": 0.116 + } + ] + }, + { + "id": 37, + "seek": 5500, + "start": 70.38, + "end": 71.98, + "text": " So, uh, I guess we're going to come up with this.", + "tokens": [ + 407, + 11, + 2232, + 11, + 286, + 2041, + 321, + 434, + 516, + 281, + 808, + 493, + 365, + 341, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.449, + "words": [ + { + "text": "So,", + "start": 70.38, + "end": 70.42, + "confidence": 0.514 + }, + { + "text": "uh,", + "start": 70.42, + "end": 70.5, + "confidence": 0.38 + }, + { + "text": "I", + "start": 70.5, + "end": 70.54, + "confidence": 0.946 + }, + { + "text": "guess", + "start": 70.54, + "end": 70.8, + "confidence": 0.99 + }, + { + "text": "we're", + "start": 70.8, + "end": 71.1, + "confidence": 0.534 + }, + { + "text": "going", + "start": 71.1, + "end": 71.28, + "confidence": 0.106 + }, + { + 
"text": "to", + "start": 71.28, + "end": 71.42, + "confidence": 0.915 + }, + { + "text": "come", + "start": 71.42, + "end": 71.48, + "confidence": 0.48 + }, + { + "text": "up", + "start": 71.48, + "end": 71.68, + "confidence": 0.579 + }, + { + "text": "with", + "start": 71.68, + "end": 71.88, + "confidence": 0.809 + }, + { + "text": "this.", + "start": 71.88, + "end": 71.98, + "confidence": 0.166 + } + ] + }, + { + "id": 38, + "seek": 5500, + "start": 72.0, + "end": 72.8, + "text": " Let us know.", + "tokens": [ + 961, + 505, + 458, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.45, + "words": [ + { + "text": "Let", + "start": 72.0, + "end": 72.14, + "confidence": 0.221 + }, + { + "text": "us", + "start": 72.14, + "end": 72.3, + "confidence": 0.272 + }, + { + "text": "know.", + "start": 72.3, + "end": 72.8, + "confidence": 0.826 + } + ] + }, + { + "id": 39, + "seek": 5500, + "start": 72.82, + "end": 73.02, + "text": " Okay.", + "tokens": [ + 1033, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.049, + "words": [ + { + "text": "Okay.", + "start": 72.82, + "end": 73.02, + "confidence": 0.049 + } + ] + }, + { + "id": 40, + "seek": 5500, + "start": 74.2, + "end": 75.48, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.077, + "words": [ + { + "text": "No", + "start": 74.2, + "end": 74.24, + "confidence": 0.005 + }, + { + "text": "problem.", + "start": 74.24, + "end": 75.48, + "confidence": 0.295 + } + ] + }, + { + "id": 41, + "seek": 5500, + "start": 75.72, + "end": 75.94, + "text": " Okay.", + "tokens": [ + 1033, + 13 + ], + 
"temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.263, + "words": [ + { + "text": "Okay.", + "start": 75.72, + "end": 75.94, + "confidence": 0.263 + } + ] + }, + { + "id": 42, + "seek": 5500, + "start": 75.96, + "end": 76.66, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.588, + "words": [ + { + "text": "No", + "start": 75.96, + "end": 76.24, + "confidence": 0.447 + }, + { + "text": "problem.", + "start": 76.24, + "end": 76.66, + "confidence": 0.673 + } + ] + }, + { + "id": 43, + "seek": 5500, + "start": 78.42, + "end": 78.5, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.031, + "words": [ + { + "text": "No", + "start": 78.42, + "end": 78.46, + "confidence": 0.032 + }, + { + "text": "problem.", + "start": 78.46, + "end": 78.5, + "confidence": 0.03 + } + ] + }, + { + "id": 44, + "seek": 5500, + "start": 78.5, + "end": 79.28, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 0.00039152163662947714, + "confidence": 0.013, + "words": [ + { + "text": "No", + "start": 78.5, + "end": 78.7, + "confidence": 0.001 + }, + { + "text": "problem.", + "start": 78.7, + "end": 79.28, + "confidence": 0.044 + } + ] + }, + { + "id": 45, + "seek": 5500, + "start": 79.3, + "end": 80.3, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.31608172647314137, + "compression_ratio": 1.8318181818181818, + "no_speech_prob": 
0.00039152163662947714, + "confidence": 0.017, + "words": [ + { + "text": "No", + "start": 79.3, + "end": 79.48, + "confidence": 0.002 + }, + { + "text": "problem.", + "start": 79.48, + "end": 80.3, + "confidence": 0.056 + } + ] + }, + { + "id": 46, + "seek": 8000, + "start": 80.32, + "end": 84.94, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3978840112686157, + "compression_ratio": 1.5217391304347827, + "no_speech_prob": 0.0009465877083130181, + "confidence": 0.029, + "words": [ + { + "text": "No", + "start": 80.32, + "end": 80.54, + "confidence": 0.004 + }, + { + "text": "problem.", + "start": 80.54, + "end": 84.94, + "confidence": 0.082 + } + ] + }, + { + "id": 47, + "seek": 8000, + "start": 85.24, + "end": 87.1, + "text": " No problem.", + "tokens": [ + 883, + 1154, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.3978840112686157, + "compression_ratio": 1.5217391304347827, + "no_speech_prob": 0.0009465877083130181, + "confidence": 0.03, + "words": [ + { + "text": "No", + "start": 85.24, + "end": 85.4, + "confidence": 0.002 + }, + { + "text": "problem.", + "start": 85.4, + "end": 87.1, + "confidence": 0.128 + } + ] + }, + { + "id": 48, + "seek": 8800, + "start": 87.52, + "end": 88.98, + "text": " No problem.", + "tokens": [ + 50364, + 883, + 1154, + 13, + 51464 + ], + "temperature": 0.0, + "avg_logprob": -0.649966835975647, + "compression_ratio": 0.5789473684210527, + "no_speech_prob": 0.0005261301412247121, + "confidence": 0.037, + "words": [ + { + "text": "No", + "start": 87.52, + "end": 88.9, + "confidence": 0.003 + }, + { + "text": "problem.", + "start": 88.9, + "end": 88.98, + "confidence": 0.137 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/naive.cuda/naive_apollo11.mp3.words.json b/tests/expected/naive.cuda/naive_apollo11.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..1d7628fb1df3720ce20a998436c90ebb59cb86c7 --- /dev/null +++ b/tests/expected/naive.cuda/naive_apollo11.mp3.words.json @@ -0,0 +1,3814 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA. Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1. And you can put the other one on the mic helmet with those GVA blizzard frames. Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, 
got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.64, + "end": 6.84, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA.", + "tokens": [ + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 20914, + 460, + 2634, + 15454, + 460, + 20914, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7235679626464844, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44993799924850464, + "confidence": 0.494, + "words": [ + { + "text": "Apollo", + "start": 0.64, + "end": 0.98, + "confidence": 0.425 + }, + { + "text": "11,", + "start": 0.98, + "end": 1.52, + "confidence": 0.842 + }, + { + "text": "Houston", + "start": 1.52, + "end": 1.78, + "confidence": 0.974 + }, + { + "text": "we", + "start": 1.78, + "end": 1.98, + "confidence": 0.453 + }, + { + "text": "got", + "start": 1.98, + "end": 2.16, + "confidence": 0.791 + }, + { + "text": "a", + "start": 2.16, + "end": 2.32, + "confidence": 0.992 + }, + { + "text": "recommendation", + "start": 2.32, + "end": 3.08, + "confidence": 0.97 + }, + { + "text": "for", + "start": 3.08, + "end": 3.5, + "confidence": 0.945 + }, + { + "text": "you", + "start": 3.5, + "end": 3.72, + "confidence": 0.99 + }, + { + "text": "on", + "start": 3.72, + "end": 4.2, + 
"confidence": 0.935 + }, + { + "text": "your", + "start": 4.2, + "end": 4.24, + "confidence": 0.974 + }, + { + "text": "Soyuz-VA", + "start": 4.24, + "end": 5.32, + "confidence": 0.327 + }, + { + "text": "GLEME", + "start": 5.32, + "end": 6.02, + "confidence": 0.178 + }, + { + "text": "GVA.", + "start": 6.02, + "end": 6.84, + "confidence": 0.321 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.82, + "end": 19.28, + "text": " Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1.", + "tokens": [ + 2798, + 11, + 1392, + 11, + 321, + 411, + 281, + 584, + 300, + 436, + 652, + 264, + 472, + 300, + 311, + 322, + 264, + 15922, + 321, + 434, + 516, + 281, + 362, + 294, + 363, + 16, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7235679626464844, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44993799924850464, + "confidence": 0.335, + "words": [ + { + "text": "Alright,", + "start": 10.82, + "end": 12.06, + "confidence": 0.126 + }, + { + "text": "okay,", + "start": 12.06, + "end": 13.06, + "confidence": 0.394 + }, + { + "text": "we", + "start": 13.06, + "end": 13.1, + "confidence": 0.478 + }, + { + "text": "like", + "start": 13.1, + "end": 13.48, + "confidence": 0.493 + }, + { + "text": "to", + "start": 13.48, + "end": 13.66, + "confidence": 0.128 + }, + { + "text": "say", + "start": 13.66, + "end": 14.94, + "confidence": 0.084 + }, + { + "text": "that", + "start": 14.94, + "end": 15.54, + "confidence": 0.225 + }, + { + "text": "they", + "start": 15.54, + "end": 15.58, + "confidence": 0.328 + }, + { + "text": "make", + "start": 15.58, + "end": 15.78, + "confidence": 0.162 + }, + { + "text": "the", + "start": 15.78, + "end": 15.92, + "confidence": 0.226 + }, + { + "text": "one", + "start": 15.92, + "end": 16.1, + "confidence": 0.559 + }, + { + "text": "that's", + "start": 16.1, + "end": 16.36, + "confidence": 0.367 + }, + { + "text": "on", + "start": 16.36, + "end": 16.6, + "confidence": 0.387 + }, + { 
+ "text": "the", + "start": 16.6, + "end": 16.84, + "confidence": 0.354 + }, + { + "text": "helmet", + "start": 16.84, + "end": 17.36, + "confidence": 0.205 + }, + { + "text": "we're", + "start": 17.36, + "end": 17.84, + "confidence": 0.297 + }, + { + "text": "going", + "start": 17.84, + "end": 18.04, + "confidence": 0.432 + }, + { + "text": "to", + "start": 18.04, + "end": 18.18, + "confidence": 0.448 + }, + { + "text": "have", + "start": 18.18, + "end": 18.24, + "confidence": 0.761 + }, + { + "text": "in", + "start": 18.24, + "end": 18.46, + "confidence": 0.743 + }, + { + "text": "B1.", + "start": 18.46, + "end": 19.28, + "confidence": 0.753 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 19.38, + "end": 24.7, + "text": " And you can put the other one on the mic helmet with those GVA blizzard frames.", + "tokens": [ + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 888, + 31062, + 12083, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7235679626464844, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44993799924850464, + "confidence": 0.123, + "words": [ + { + "text": "And", + "start": 19.38, + "end": 20.14, + "confidence": 0.321 + }, + { + "text": "you", + "start": 20.14, + "end": 20.36, + "confidence": 0.904 + }, + { + "text": "can", + "start": 20.36, + "end": 20.54, + "confidence": 0.363 + }, + { + "text": "put", + "start": 20.54, + "end": 20.72, + "confidence": 0.939 + }, + { + "text": "the", + "start": 20.72, + "end": 20.86, + "confidence": 0.978 + }, + { + "text": "other", + "start": 20.86, + "end": 21.06, + "confidence": 0.995 + }, + { + "text": "one", + "start": 21.06, + "end": 21.26, + "confidence": 0.965 + }, + { + "text": "on", + "start": 21.26, + "end": 21.68, + "confidence": 0.961 + }, + { + "text": "the", + "start": 21.68, + "end": 21.74, + "confidence": 0.199 + }, + { + "text": "mic", + "start": 21.74, + "end": 22.58, + "confidence": 0.694 + }, + { + "text": 
"helmet", + "start": 22.58, + "end": 22.94, + "confidence": 0.007 + }, + { + "text": "with", + "start": 22.94, + "end": 23.2, + "confidence": 0.059 + }, + { + "text": "those", + "start": 23.2, + "end": 23.46, + "confidence": 0.046 + }, + { + "text": "GVA", + "start": 23.46, + "end": 23.86, + "confidence": 0.001 + }, + { + "text": "blizzard", + "start": 23.86, + "end": 24.32, + "confidence": 0.032 + }, + { + "text": "frames.", + "start": 24.32, + "end": 24.7, + "confidence": 0.231 + } + ] + }, + { + "id": 3, + "seek": 2500, + "start": 31.36, + "end": 54.68, + "text": " Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 2798, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 
11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.10793833414713541, + "compression_ratio": 24.096774193548388, + "no_speech_prob": 0.0011014570482075214, + "confidence": 0.887, + "words": [ + { + "text": "Alright,", + "start": 31.36, + "end": 31.98, + "confidence": 0.077 + }, + { + "text": "got", + "start": 31.98, + "end": 32.02, + "confidence": 0.169 + }, + { + "text": "them,", + "start": 32.02, + "end": 32.52, + "confidence": 0.189 + }, + { + "text": "got", + "start": 32.52, + "end": 33.0, + "confidence": 0.429 + }, + { + "text": "them,", + "start": 33.0, + "end": 33.78, + "confidence": 0.613 + }, + { + "text": "got", + "start": 33.78, + "end": 33.82, + "confidence": 0.67 + }, + { + "text": "them,", + "start": 33.82, + "end": 34.56, + "confidence": 0.495 + }, + { + "text": "got", + "start": 34.56, + "end": 34.74, + "confidence": 0.664 + }, + { + "text": "them,", + "start": 34.74, + "end": 34.78, + "confidence": 0.486 + }, + { + "text": "got", + "start": 34.78, + "end": 35.02, + "confidence": 0.756 + }, + { + "text": "them,", + "start": 35.02, + "end": 35.06, + "confidence": 0.565 + }, + { + "text": "got", + "start": 35.06, + "end": 35.1, + 
"confidence": 0.781 + }, + { + "text": "them,", + "start": 35.1, + "end": 35.14, + "confidence": 0.684 + }, + { + "text": "got", + "start": 35.14, + "end": 35.32, + "confidence": 0.858 + }, + { + "text": "them,", + "start": 35.32, + "end": 35.98, + "confidence": 0.803 + }, + { + "text": "got", + "start": 35.98, + "end": 36.02, + "confidence": 0.917 + }, + { + "text": "them,", + "start": 36.02, + "end": 36.06, + "confidence": 0.767 + }, + { + "text": "got", + "start": 36.06, + "end": 36.1, + "confidence": 0.584 + }, + { + "text": "them,", + "start": 36.1, + "end": 36.14, + "confidence": 0.843 + }, + { + "text": "got", + "start": 36.14, + "end": 36.18, + "confidence": 0.926 + }, + { + "text": "them,", + "start": 36.18, + "end": 36.22, + "confidence": 0.887 + }, + { + "text": "got", + "start": 36.22, + "end": 36.26, + "confidence": 0.936 + }, + { + "text": "them,", + "start": 36.26, + "end": 36.4, + "confidence": 0.903 + }, + { + "text": "got", + "start": 36.4, + "end": 36.44, + "confidence": 0.939 + }, + { + "text": "them,", + "start": 36.44, + "end": 36.48, + "confidence": 0.909 + }, + { + "text": "got", + "start": 36.48, + "end": 36.52, + "confidence": 0.948 + }, + { + "text": "them,", + "start": 36.52, + "end": 36.56, + "confidence": 0.902 + }, + { + "text": "got", + "start": 36.56, + "end": 36.6, + "confidence": 0.942 + }, + { + "text": "them,", + "start": 36.6, + "end": 36.64, + "confidence": 0.904 + }, + { + "text": "got", + "start": 36.64, + "end": 36.68, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 36.68, + "end": 36.72, + "confidence": 0.911 + }, + { + "text": "got", + "start": 36.72, + "end": 36.76, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 36.76, + "end": 36.8, + "confidence": 0.918 + }, + { + "text": "got", + "start": 36.8, + "end": 36.84, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 36.84, + "end": 36.88, + "confidence": 0.923 + }, + { + "text": "got", + "start": 36.88, + "end": 36.92, + "confidence": 
0.937 + }, + { + "text": "them,", + "start": 36.92, + "end": 36.96, + "confidence": 0.93 + }, + { + "text": "got", + "start": 36.96, + "end": 37.0, + "confidence": 0.938 + }, + { + "text": "them,", + "start": 37.0, + "end": 37.04, + "confidence": 0.936 + }, + { + "text": "got", + "start": 37.04, + "end": 37.08, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 37.08, + "end": 37.12, + "confidence": 0.941 + }, + { + "text": "got", + "start": 37.12, + "end": 37.16, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 37.16, + "end": 37.2, + "confidence": 0.944 + }, + { + "text": "got", + "start": 37.2, + "end": 37.24, + "confidence": 0.948 + }, + { + "text": "them,", + "start": 37.24, + "end": 37.28, + "confidence": 0.947 + }, + { + "text": "got", + "start": 37.28, + "end": 37.32, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 37.32, + "end": 37.36, + "confidence": 0.95 + }, + { + "text": "got", + "start": 37.36, + "end": 37.4, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 37.4, + "end": 37.44, + "confidence": 0.953 + }, + { + "text": "got", + "start": 37.44, + "end": 37.48, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 37.48, + "end": 37.52, + "confidence": 0.956 + }, + { + "text": "got", + "start": 37.52, + "end": 37.56, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 37.56, + "end": 37.6, + "confidence": 0.956 + }, + { + "text": "got", + "start": 37.6, + "end": 37.64, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 37.64, + "end": 37.68, + "confidence": 0.957 + }, + { + "text": "got", + "start": 37.68, + "end": 37.72, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 37.72, + "end": 37.76, + "confidence": 0.961 + }, + { + "text": "got", + "start": 37.76, + "end": 37.8, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 37.8, + "end": 37.84, + "confidence": 0.961 + }, + { + "text": "got", + "start": 37.84, + "end": 37.88, + "confidence": 0.955 + }, + { + 
"text": "them,", + "start": 37.88, + "end": 37.92, + "confidence": 0.962 + }, + { + "text": "got", + "start": 37.92, + "end": 37.96, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 37.96, + "end": 38.0, + "confidence": 0.964 + }, + { + "text": "got", + "start": 38.0, + "end": 38.04, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 38.04, + "end": 38.08, + "confidence": 0.965 + }, + { + "text": "got", + "start": 38.08, + "end": 38.12, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 38.12, + "end": 38.16, + "confidence": 0.965 + }, + { + "text": "got", + "start": 38.16, + "end": 38.2, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 38.2, + "end": 38.24, + "confidence": 0.968 + }, + { + "text": "got", + "start": 38.24, + "end": 38.28, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 38.28, + "end": 38.32, + "confidence": 0.969 + }, + { + "text": "got", + "start": 38.32, + "end": 38.36, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 38.36, + "end": 38.4, + "confidence": 0.968 + }, + { + "text": "got", + "start": 38.4, + "end": 38.44, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 38.44, + "end": 38.48, + "confidence": 0.971 + }, + { + "text": "got", + "start": 38.48, + "end": 38.52, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 38.52, + "end": 38.56, + "confidence": 0.972 + }, + { + "text": "got", + "start": 38.56, + "end": 38.6, + "confidence": 0.966 + }, + { + "text": "them,", + "start": 38.6, + "end": 38.64, + "confidence": 0.974 + }, + { + "text": "got", + "start": 38.64, + "end": 38.68, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 38.68, + "end": 38.72, + "confidence": 0.974 + }, + { + "text": "got", + "start": 38.72, + "end": 38.76, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 38.76, + "end": 38.8, + "confidence": 0.974 + }, + { + "text": "got", + "start": 38.8, + "end": 38.84, + "confidence": 0.972 + }, + { + "text": "them,", 
+ "start": 38.84, + "end": 38.88, + "confidence": 0.976 + }, + { + "text": "got", + "start": 38.88, + "end": 38.92, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 38.92, + "end": 38.96, + "confidence": 0.978 + }, + { + "text": "got", + "start": 38.96, + "end": 39.0, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 39.0, + "end": 39.04, + "confidence": 0.978 + }, + { + "text": "got", + "start": 39.04, + "end": 39.08, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 39.08, + "end": 39.12, + "confidence": 0.979 + }, + { + "text": "got", + "start": 39.12, + "end": 39.16, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 39.16, + "end": 39.2, + "confidence": 0.979 + }, + { + "text": "got", + "start": 39.2, + "end": 39.24, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 39.24, + "end": 39.28, + "confidence": 0.981 + }, + { + "text": "got", + "start": 39.28, + "end": 39.32, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 39.32, + "end": 39.36, + "confidence": 0.982 + }, + { + "text": "got", + "start": 39.36, + "end": 39.4, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 39.4, + "end": 39.44, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.44, + "end": 39.48, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 39.48, + "end": 39.52, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.52, + "end": 39.56, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 39.56, + "end": 39.6, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.6, + "end": 39.64, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 39.64, + "end": 39.68, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.68, + "end": 39.72, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.72, + "end": 39.76, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.76, + "end": 39.8, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.8, 
+ "end": 39.84, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.84, + "end": 39.88, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.88, + "end": 39.92, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.92, + "end": 39.96, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.96, + "end": 40.0, + "confidence": 0.986 + }, + { + "text": "got", + "start": 40.0, + "end": 40.04, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 40.04, + "end": 40.08, + "confidence": 0.986 + }, + { + "text": "got", + "start": 40.08, + "end": 40.12, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.12, + "end": 40.16, + "confidence": 0.986 + }, + { + "text": "got", + "start": 40.16, + "end": 40.2, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 40.2, + "end": 40.24, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.24, + "end": 40.28, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.28, + "end": 40.32, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.32, + "end": 40.36, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.36, + "end": 40.4, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.4, + "end": 40.44, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 40.44, + "end": 40.48, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.48, + "end": 40.52, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.52, + "end": 40.56, + "confidence": 0.988 + }, + { + "text": "got", + "start": 40.56, + "end": 40.6, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.6, + "end": 40.64, + "confidence": 0.987 + }, + { + "text": "got", + "start": 40.64, + "end": 40.68, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.68, + "end": 40.86, + "confidence": 0.989 + }, + { + "text": "got", + "start": 40.86, + "end": 40.9, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.9, + "end": 40.94, + 
"confidence": 0.989 + }, + { + "text": "got", + "start": 40.94, + "end": 40.98, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.98, + "end": 41.24, + "confidence": 0.989 + }, + { + "text": "got", + "start": 41.24, + "end": 41.36, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 41.36, + "end": 42.3, + "confidence": 0.989 + }, + { + "text": "got", + "start": 42.3, + "end": 42.5, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 42.5, + "end": 42.98, + "confidence": 0.989 + }, + { + "text": "got", + "start": 42.98, + "end": 44.02, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 44.02, + "end": 44.42, + "confidence": 0.989 + }, + { + "text": "got", + "start": 44.42, + "end": 44.78, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 44.78, + "end": 45.16, + "confidence": 0.989 + }, + { + "text": "got", + "start": 45.16, + "end": 46.22, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 46.22, + "end": 46.52, + "confidence": 0.99 + }, + { + "text": "got", + "start": 46.52, + "end": 46.72, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 46.72, + "end": 47.72, + "confidence": 0.99 + }, + { + "text": "got", + "start": 47.72, + "end": 48.58, + "confidence": 0.993 + }, + { + "text": "them", + "start": 48.58, + "end": 54.68, + "confidence": 0.996 + } + ] + }, + { + "id": 4, + "seek": 5500, + "start": 72.0, + "end": 84.66, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, 
got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.05313390894321048, + "compression_ratio": 29.52, + "no_speech_prob": 0.24548843502998352, + "confidence": 0.84, + "words": [ + { + "text": "got", + "start": 72.0, + "end": 72.04, + "confidence": 0.005 + }, + { + "text": "them,", + "start": 72.04, + "end": 72.08, + "confidence": 0.007 
+ }, + { + "text": "got", + "start": 72.08, + "end": 72.12, + "confidence": 0.049 + }, + { + "text": "them,", + "start": 72.12, + "end": 72.16, + "confidence": 0.35 + }, + { + "text": "got", + "start": 72.16, + "end": 72.2, + "confidence": 0.65 + }, + { + "text": "them,", + "start": 72.2, + "end": 72.24, + "confidence": 0.549 + }, + { + "text": "got", + "start": 72.24, + "end": 72.28, + "confidence": 0.837 + }, + { + "text": "them,", + "start": 72.28, + "end": 72.32, + "confidence": 0.614 + }, + { + "text": "got", + "start": 72.32, + "end": 72.36, + "confidence": 0.891 + }, + { + "text": "them,", + "start": 72.36, + "end": 72.4, + "confidence": 0.665 + }, + { + "text": "got", + "start": 72.4, + "end": 72.44, + "confidence": 0.909 + }, + { + "text": "them,", + "start": 72.44, + "end": 72.48, + "confidence": 0.689 + }, + { + "text": "got", + "start": 72.48, + "end": 72.52, + "confidence": 0.861 + }, + { + "text": "them,", + "start": 72.52, + "end": 72.56, + "confidence": 0.772 + }, + { + "text": "got", + "start": 72.56, + "end": 72.6, + "confidence": 0.91 + }, + { + "text": "them,", + "start": 72.6, + "end": 72.64, + "confidence": 0.84 + }, + { + "text": "got", + "start": 72.64, + "end": 72.68, + "confidence": 0.933 + }, + { + "text": "them,", + "start": 72.68, + "end": 72.72, + "confidence": 0.633 + }, + { + "text": "got", + "start": 72.72, + "end": 72.76, + "confidence": 0.173 + }, + { + "text": "them,", + "start": 72.76, + "end": 72.8, + "confidence": 0.776 + }, + { + "text": "got", + "start": 72.8, + "end": 72.84, + "confidence": 0.824 + }, + { + "text": "them,", + "start": 72.84, + "end": 72.88, + "confidence": 0.832 + }, + { + "text": "got", + "start": 72.88, + "end": 72.92, + "confidence": 0.846 + }, + { + "text": "them,", + "start": 72.92, + "end": 72.96, + "confidence": 0.849 + }, + { + "text": "got", + "start": 72.96, + "end": 73.0, + "confidence": 0.846 + }, + { + "text": "them,", + "start": 73.0, + "end": 73.04, + "confidence": 0.867 + }, + { + "text": 
"got", + "start": 73.04, + "end": 73.08, + "confidence": 0.87 + }, + { + "text": "them,", + "start": 73.08, + "end": 73.12, + "confidence": 0.893 + }, + { + "text": "got", + "start": 73.12, + "end": 73.16, + "confidence": 0.902 + }, + { + "text": "them,", + "start": 73.16, + "end": 73.2, + "confidence": 0.905 + }, + { + "text": "got", + "start": 73.2, + "end": 73.24, + "confidence": 0.898 + }, + { + "text": "them,", + "start": 73.24, + "end": 73.28, + "confidence": 0.906 + }, + { + "text": "got", + "start": 73.28, + "end": 73.32, + "confidence": 0.876 + }, + { + "text": "them,", + "start": 73.32, + "end": 73.36, + "confidence": 0.916 + }, + { + "text": "got", + "start": 73.36, + "end": 73.4, + "confidence": 0.885 + }, + { + "text": "them,", + "start": 73.4, + "end": 73.44, + "confidence": 0.923 + }, + { + "text": "got", + "start": 73.44, + "end": 73.48, + "confidence": 0.892 + }, + { + "text": "them,", + "start": 73.48, + "end": 73.52, + "confidence": 0.931 + }, + { + "text": "got", + "start": 73.52, + "end": 73.56, + "confidence": 0.902 + }, + { + "text": "them,", + "start": 73.56, + "end": 73.6, + "confidence": 0.935 + }, + { + "text": "got", + "start": 73.6, + "end": 73.64, + "confidence": 0.908 + }, + { + "text": "them,", + "start": 73.64, + "end": 73.68, + "confidence": 0.941 + }, + { + "text": "got", + "start": 73.68, + "end": 73.72, + "confidence": 0.912 + }, + { + "text": "them,", + "start": 73.72, + "end": 73.76, + "confidence": 0.944 + }, + { + "text": "got", + "start": 73.76, + "end": 73.8, + "confidence": 0.918 + }, + { + "text": "them,", + "start": 73.8, + "end": 73.84, + "confidence": 0.948 + }, + { + "text": "got", + "start": 73.84, + "end": 73.88, + "confidence": 0.923 + }, + { + "text": "them,", + "start": 73.88, + "end": 73.92, + "confidence": 0.95 + }, + { + "text": "got", + "start": 73.92, + "end": 73.96, + "confidence": 0.926 + }, + { + "text": "them,", + "start": 73.96, + "end": 74.0, + "confidence": 0.953 + }, + { + "text": "got", + "start": 
74.0, + "end": 74.04, + "confidence": 0.927 + }, + { + "text": "them,", + "start": 74.04, + "end": 74.08, + "confidence": 0.956 + }, + { + "text": "got", + "start": 74.08, + "end": 74.12, + "confidence": 0.927 + }, + { + "text": "them,", + "start": 74.12, + "end": 74.16, + "confidence": 0.956 + }, + { + "text": "got", + "start": 74.16, + "end": 74.2, + "confidence": 0.928 + }, + { + "text": "them,", + "start": 74.2, + "end": 74.24, + "confidence": 0.957 + }, + { + "text": "got", + "start": 74.24, + "end": 74.28, + "confidence": 0.93 + }, + { + "text": "them,", + "start": 74.28, + "end": 74.32, + "confidence": 0.959 + }, + { + "text": "got", + "start": 74.32, + "end": 74.36, + "confidence": 0.93 + }, + { + "text": "them,", + "start": 74.36, + "end": 74.4, + "confidence": 0.96 + }, + { + "text": "got", + "start": 74.4, + "end": 74.44, + "confidence": 0.931 + }, + { + "text": "them,", + "start": 74.44, + "end": 74.48, + "confidence": 0.961 + }, + { + "text": "got", + "start": 74.48, + "end": 74.52, + "confidence": 0.933 + }, + { + "text": "them,", + "start": 74.52, + "end": 74.56, + "confidence": 0.962 + }, + { + "text": "got", + "start": 74.56, + "end": 74.6, + "confidence": 0.933 + }, + { + "text": "them,", + "start": 74.6, + "end": 74.64, + "confidence": 0.963 + }, + { + "text": "got", + "start": 74.64, + "end": 74.68, + "confidence": 0.934 + }, + { + "text": "them,", + "start": 74.68, + "end": 74.72, + "confidence": 0.963 + }, + { + "text": "got", + "start": 74.72, + "end": 74.76, + "confidence": 0.935 + }, + { + "text": "them,", + "start": 74.76, + "end": 74.8, + "confidence": 0.964 + }, + { + "text": "got", + "start": 74.8, + "end": 74.84, + "confidence": 0.937 + }, + { + "text": "them,", + "start": 74.84, + "end": 74.88, + "confidence": 0.964 + }, + { + "text": "got", + "start": 74.88, + "end": 74.92, + "confidence": 0.939 + }, + { + "text": "them,", + "start": 74.92, + "end": 74.96, + "confidence": 0.965 + }, + { + "text": "got", + "start": 74.96, + "end": 
75.0, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 75.0, + "end": 75.04, + "confidence": 0.966 + }, + { + "text": "got", + "start": 75.04, + "end": 75.08, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 75.08, + "end": 75.12, + "confidence": 0.967 + }, + { + "text": "got", + "start": 75.12, + "end": 75.16, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 75.16, + "end": 75.2, + "confidence": 0.968 + }, + { + "text": "got", + "start": 75.2, + "end": 75.24, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 75.24, + "end": 75.28, + "confidence": 0.968 + }, + { + "text": "got", + "start": 75.28, + "end": 75.32, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 75.32, + "end": 75.36, + "confidence": 0.969 + }, + { + "text": "got", + "start": 75.36, + "end": 75.4, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 75.4, + "end": 75.44, + "confidence": 0.969 + }, + { + "text": "got", + "start": 75.44, + "end": 75.48, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 75.48, + "end": 75.52, + "confidence": 0.97 + }, + { + "text": "got", + "start": 75.52, + "end": 75.56, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 75.56, + "end": 75.6, + "confidence": 0.971 + }, + { + "text": "got", + "start": 75.6, + "end": 75.64, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 75.64, + "end": 75.68, + "confidence": 0.973 + }, + { + "text": "got", + "start": 75.68, + "end": 75.72, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 75.72, + "end": 75.76, + "confidence": 0.973 + }, + { + "text": "got", + "start": 75.76, + "end": 75.8, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 75.8, + "end": 75.84, + "confidence": 0.973 + }, + { + "text": "got", + "start": 75.84, + "end": 75.88, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 75.88, + "end": 75.92, + "confidence": 0.973 + }, + { + "text": "got", + "start": 75.92, + "end": 75.96, + 
"confidence": 0.969 + }, + { + "text": "them,", + "start": 75.96, + "end": 76.0, + "confidence": 0.975 + }, + { + "text": "got", + "start": 76.0, + "end": 76.04, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 76.04, + "end": 76.08, + "confidence": 0.975 + }, + { + "text": "got", + "start": 76.08, + "end": 76.12, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 76.12, + "end": 76.16, + "confidence": 0.976 + }, + { + "text": "got", + "start": 76.16, + "end": 76.2, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 76.2, + "end": 76.24, + "confidence": 0.976 + }, + { + "text": "got", + "start": 76.24, + "end": 76.28, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 76.28, + "end": 76.32, + "confidence": 0.975 + }, + { + "text": "got", + "start": 76.32, + "end": 76.36, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 76.36, + "end": 76.4, + "confidence": 0.977 + }, + { + "text": "got", + "start": 76.4, + "end": 76.44, + "confidence": 0.978 + }, + { + "text": "them,", + "start": 76.44, + "end": 76.48, + "confidence": 0.977 + }, + { + "text": "got", + "start": 76.48, + "end": 76.52, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 76.52, + "end": 76.56, + "confidence": 0.978 + }, + { + "text": "got", + "start": 76.56, + "end": 76.6, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 76.6, + "end": 76.64, + "confidence": 0.978 + }, + { + "text": "got", + "start": 76.64, + "end": 76.68, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 76.68, + "end": 76.72, + "confidence": 0.979 + }, + { + "text": "got", + "start": 76.72, + "end": 76.76, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 76.76, + "end": 76.8, + "confidence": 0.978 + }, + { + "text": "got", + "start": 76.8, + "end": 76.84, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 76.84, + "end": 76.88, + "confidence": 0.98 + }, + { + "text": "got", + "start": 76.88, + "end": 76.92, + "confidence": 0.984 
+ }, + { + "text": "them,", + "start": 76.92, + "end": 76.96, + "confidence": 0.98 + }, + { + "text": "got", + "start": 76.96, + "end": 77.0, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 77.0, + "end": 77.04, + "confidence": 0.98 + }, + { + "text": "got", + "start": 77.04, + "end": 77.08, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 77.08, + "end": 77.12, + "confidence": 0.98 + }, + { + "text": "got", + "start": 77.12, + "end": 77.16, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 77.16, + "end": 77.2, + "confidence": 0.98 + }, + { + "text": "got", + "start": 77.2, + "end": 77.24, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 77.24, + "end": 77.28, + "confidence": 0.981 + }, + { + "text": "got", + "start": 77.28, + "end": 77.32, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 77.32, + "end": 77.36, + "confidence": 0.982 + }, + { + "text": "got", + "start": 77.36, + "end": 77.4, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 77.4, + "end": 77.44, + "confidence": 0.983 + }, + { + "text": "got", + "start": 77.44, + "end": 77.48, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 77.48, + "end": 77.52, + "confidence": 0.982 + }, + { + "text": "got", + "start": 77.52, + "end": 77.56, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 77.56, + "end": 77.6, + "confidence": 0.984 + }, + { + "text": "got", + "start": 77.6, + "end": 77.64, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 77.64, + "end": 78.74, + "confidence": 0.983 + }, + { + "text": "got", + "start": 78.74, + "end": 78.8, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 78.8, + "end": 79.8, + "confidence": 0.984 + }, + { + "text": "got", + "start": 79.8, + "end": 80.08, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 80.08, + "end": 83.98, + "confidence": 0.984 + }, + { + "text": "got", + "start": 83.98, + "end": 84.16, + "confidence": 0.991 + }, + { + "text": 
"them", + "start": 84.16, + "end": 84.66, + "confidence": 0.994 + } + ] + }, + { + "id": 5, + "seek": 8500, + "start": 84.68, + "end": 94.48, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 
658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.04979915789959142, + "compression_ratio": 29.52, + "no_speech_prob": 0.6971050500869751, + "confidence": 0.848, + "words": [ + { + "text": "got", + "start": 84.68, + "end": 85.42, + "confidence": 0.0 + }, + { + "text": "them,", + "start": 85.42, + "end": 85.92, + "confidence": 0.023 + }, + { + "text": "got", + "start": 85.92, + "end": 86.74, + "confidence": 0.821 + }, + { + "text": "them,", + "start": 86.74, + "end": 87.2, + "confidence": 0.604 + }, + { + "text": "got", + "start": 87.2, + "end": 88.62, + "confidence": 0.84 + }, + { + "text": "them,", + "start": 88.62, + "end": 88.66, + "confidence": 0.451 + }, + { + "text": "got", + "start": 88.66, + "end": 88.84, + "confidence": 0.887 + }, + { + "text": "them,", + "start": 88.84, + "end": 88.88, + "confidence": 0.382 + }, + { + "text": "got", + "start": 88.88, + "end": 88.92, + "confidence": 0.902 + }, + { + "text": "them,", + "start": 88.92, + "end": 88.96, + "confidence": 0.353 + }, + { + "text": "got", + "start": 88.96, + "end": 89.0, + "confidence": 0.896 + }, + { + "text": "them,", + "start": 89.0, + "end": 89.04, + "confidence": 0.352 + }, + { + "text": "got", + "start": 89.04, + "end": 89.08, + "confidence": 0.869 + }, + { + "text": "them,", + "start": 89.08, + "end": 89.12, + "confidence": 0.423 + }, + { + "text": "got", + "start": 89.12, + "end": 89.16, + "confidence": 0.889 + }, + { + "text": "them,", + "start": 89.16, + "end": 89.2, + "confidence": 0.528 + }, + { + "text": "got", + "start": 89.2, + "end": 89.24, + "confidence": 0.91 + }, + { + "text": "them,", + "start": 
89.24, + "end": 89.28, + "confidence": 0.619 + }, + { + "text": "got", + "start": 89.28, + "end": 89.32, + "confidence": 0.65 + }, + { + "text": "them,", + "start": 89.32, + "end": 89.36, + "confidence": 0.71 + }, + { + "text": "got", + "start": 89.36, + "end": 89.4, + "confidence": 0.835 + }, + { + "text": "them,", + "start": 89.4, + "end": 89.44, + "confidence": 0.815 + }, + { + "text": "got", + "start": 89.44, + "end": 89.48, + "confidence": 0.908 + }, + { + "text": "them,", + "start": 89.48, + "end": 89.52, + "confidence": 0.874 + }, + { + "text": "got", + "start": 89.52, + "end": 89.56, + "confidence": 0.925 + }, + { + "text": "them,", + "start": 89.56, + "end": 89.6, + "confidence": 0.907 + }, + { + "text": "got", + "start": 89.6, + "end": 89.64, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 89.64, + "end": 89.68, + "confidence": 0.927 + }, + { + "text": "got", + "start": 89.68, + "end": 89.72, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 89.72, + "end": 89.76, + "confidence": 0.941 + }, + { + "text": "got", + "start": 89.76, + "end": 89.8, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 89.8, + "end": 89.84, + "confidence": 0.942 + }, + { + "text": "got", + "start": 89.84, + "end": 89.88, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 89.88, + "end": 89.92, + "confidence": 0.943 + }, + { + "text": "got", + "start": 89.92, + "end": 89.96, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 89.96, + "end": 90.0, + "confidence": 0.945 + }, + { + "text": "got", + "start": 90.0, + "end": 90.04, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 90.04, + "end": 90.08, + "confidence": 0.952 + }, + { + "text": "got", + "start": 90.08, + "end": 90.12, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 90.12, + "end": 90.16, + "confidence": 0.955 + }, + { + "text": "got", + "start": 90.16, + "end": 90.2, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 90.2, + "end": 
90.24, + "confidence": 0.961 + }, + { + "text": "got", + "start": 90.24, + "end": 90.28, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 90.28, + "end": 90.32, + "confidence": 0.964 + }, + { + "text": "got", + "start": 90.32, + "end": 90.36, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 90.36, + "end": 90.4, + "confidence": 0.967 + }, + { + "text": "got", + "start": 90.4, + "end": 90.44, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 90.44, + "end": 90.48, + "confidence": 0.97 + }, + { + "text": "got", + "start": 90.48, + "end": 90.52, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 90.52, + "end": 90.56, + "confidence": 0.973 + }, + { + "text": "got", + "start": 90.56, + "end": 90.6, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 90.6, + "end": 90.64, + "confidence": 0.977 + }, + { + "text": "got", + "start": 90.64, + "end": 90.68, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 90.68, + "end": 90.72, + "confidence": 0.977 + }, + { + "text": "got", + "start": 90.72, + "end": 90.76, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 90.76, + "end": 90.8, + "confidence": 0.978 + }, + { + "text": "got", + "start": 90.8, + "end": 90.84, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 90.84, + "end": 90.88, + "confidence": 0.979 + }, + { + "text": "got", + "start": 90.88, + "end": 90.92, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 90.92, + "end": 90.96, + "confidence": 0.981 + }, + { + "text": "got", + "start": 90.96, + "end": 91.0, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 91.0, + "end": 91.04, + "confidence": 0.981 + }, + { + "text": "got", + "start": 91.04, + "end": 91.08, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 91.08, + "end": 91.12, + "confidence": 0.982 + }, + { + "text": "got", + "start": 91.12, + "end": 91.16, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 91.16, + "end": 91.2, + 
"confidence": 0.983 + }, + { + "text": "got", + "start": 91.2, + "end": 91.24, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 91.24, + "end": 91.28, + "confidence": 0.983 + }, + { + "text": "got", + "start": 91.28, + "end": 91.32, + "confidence": 0.96 + }, + { + "text": "them,", + "start": 91.32, + "end": 91.36, + "confidence": 0.984 + }, + { + "text": "got", + "start": 91.36, + "end": 91.4, + "confidence": 0.962 + }, + { + "text": "them,", + "start": 91.4, + "end": 91.44, + "confidence": 0.983 + }, + { + "text": "got", + "start": 91.44, + "end": 91.48, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 91.48, + "end": 91.52, + "confidence": 0.985 + }, + { + "text": "got", + "start": 91.52, + "end": 91.56, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 91.56, + "end": 91.6, + "confidence": 0.985 + }, + { + "text": "got", + "start": 91.6, + "end": 91.64, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 91.64, + "end": 91.68, + "confidence": 0.986 + }, + { + "text": "got", + "start": 91.68, + "end": 91.72, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 91.72, + "end": 91.76, + "confidence": 0.986 + }, + { + "text": "got", + "start": 91.76, + "end": 91.8, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 91.8, + "end": 91.84, + "confidence": 0.987 + }, + { + "text": "got", + "start": 91.84, + "end": 91.88, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 91.88, + "end": 91.92, + "confidence": 0.987 + }, + { + "text": "got", + "start": 91.92, + "end": 91.96, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 91.96, + "end": 92.0, + "confidence": 0.987 + }, + { + "text": "got", + "start": 92.0, + "end": 92.04, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 92.04, + "end": 92.08, + "confidence": 0.988 + }, + { + "text": "got", + "start": 92.08, + "end": 92.12, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 92.12, + "end": 92.16, + "confidence": 
0.988 + }, + { + "text": "got", + "start": 92.16, + "end": 92.2, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 92.2, + "end": 92.24, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.24, + "end": 92.28, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 92.28, + "end": 92.32, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.32, + "end": 92.36, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 92.36, + "end": 92.4, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.4, + "end": 92.44, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 92.44, + "end": 92.48, + "confidence": 0.989 + }, + { + "text": "got", + "start": 92.48, + "end": 92.52, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 92.52, + "end": 92.56, + "confidence": 0.99 + }, + { + "text": "got", + "start": 92.56, + "end": 92.6, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 92.6, + "end": 92.64, + "confidence": 0.991 + }, + { + "text": "got", + "start": 92.64, + "end": 92.68, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 92.68, + "end": 92.72, + "confidence": 0.991 + }, + { + "text": "got", + "start": 92.72, + "end": 92.76, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 92.76, + "end": 92.8, + "confidence": 0.991 + }, + { + "text": "got", + "start": 92.8, + "end": 92.84, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 92.84, + "end": 92.88, + "confidence": 0.991 + }, + { + "text": "got", + "start": 92.88, + "end": 92.92, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 92.92, + "end": 92.96, + "confidence": 0.992 + }, + { + "text": "got", + "start": 92.96, + "end": 93.0, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 93.0, + "end": 93.04, + "confidence": 0.992 + }, + { + "text": "got", + "start": 93.04, + "end": 93.08, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 93.08, + "end": 93.12, + "confidence": 0.992 + }, + { + 
"text": "got", + "start": 93.12, + "end": 93.16, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 93.16, + "end": 93.2, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.2, + "end": 93.24, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 93.24, + "end": 93.28, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.28, + "end": 93.32, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 93.32, + "end": 93.36, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.36, + "end": 93.4, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 93.4, + "end": 93.44, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.44, + "end": 93.48, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 93.48, + "end": 93.52, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.52, + "end": 93.56, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 93.56, + "end": 93.6, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.6, + "end": 93.64, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 93.64, + "end": 93.68, + "confidence": 0.993 + }, + { + "text": "got", + "start": 93.68, + "end": 93.72, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 93.72, + "end": 93.76, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.76, + "end": 93.8, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 93.8, + "end": 93.84, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.84, + "end": 93.88, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 93.88, + "end": 93.92, + "confidence": 0.994 + }, + { + "text": "got", + "start": 93.92, + "end": 93.96, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 93.96, + "end": 94.0, + "confidence": 0.994 + }, + { + "text": "got", + "start": 94.0, + "end": 94.04, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 94.04, + "end": 94.08, + "confidence": 0.994 + }, + { + "text": "got", + 
"start": 94.08, + "end": 94.12, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 94.12, + "end": 94.16, + "confidence": 0.995 + }, + { + "text": "got", + "start": 94.16, + "end": 94.2, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 94.2, + "end": 94.24, + "confidence": 0.994 + }, + { + "text": "got", + "start": 94.24, + "end": 94.28, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 94.28, + "end": 94.32, + "confidence": 0.994 + }, + { + "text": "got", + "start": 94.32, + "end": 94.36, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 94.36, + "end": 94.4, + "confidence": 0.994 + }, + { + "text": "got", + "start": 94.4, + "end": 94.44, + "confidence": 0.995 + }, + { + "text": "them", + "start": 94.44, + "end": 94.48, + "confidence": 0.998 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/naive/accurate_apollo11.mp3.words.json b/tests/expected/naive/accurate_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..1f11dd18ce3fb73e4522e0caf68bd4780a40a3f3 --- /dev/null +++ b/tests/expected/naive/accurate_apollo11.mp3.words.json @@ -0,0 +1,2288 @@ +{ + "text": " Apollo 11, Houston, we got a recommendation for you on your Soyuz-EA GLEM-E-G-E-A. All right. Okay. Yeah, sir. Yeah, sir. Let's take that camera. Let's say it makes it want to go on the helmet we were going to have in B-1. The other one. And you can put the other one on the mic helmet. We'll show it to you in a quick screen. Over. All right. Yeah, sir. All right. Yeah, sir. There's a better helmet than B-1. That's the other one. Nice. Let's go in there. At least we're safe. We've got them in there. Helmet bags. And, uh, I guess we have helmets in the helmet bag. At least it's in the helmet bag. Right here. Right here. Yeah, we're taking it next day. Yeah, we're taking it next day. We're gonna hang me on the cover. I tried it already. Okay, fine. 
We weren't sure that, uh, just a suggestion. We thought we'd, uh, that you could check it out. It's not much of an order, sir. And so, uh, I guess we're gonna come up with this. Let us know. Okay. No problem. Okay. No problem. No problem. No worry. None. Thank you.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.54, + "end": 6.66, + "text": " Apollo 11, Houston, we got a recommendation for you on your Soyuz-EA GLEM-E-G-E-A.", + "tokens": [ + 50364, + 25187, + 2975, + 11, + 18717, + 11, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 36, + 32, + 460, + 2634, + 44, + 12, + 36, + 12, + 38, + 12, + 36, + 12, + 32, + 13, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.578, + "words": [ + { + "text": "Apollo", + "start": 0.54, + "end": 0.92, + "confidence": 0.425 + }, + { + "text": "11,", + "start": 0.92, + "end": 1.26, + "confidence": 0.842 + }, + { + "text": "Houston,", + "start": 1.52, + "end": 1.72, + "confidence": 0.665 + }, + { + "text": "we", + "start": 1.9, + "end": 1.94, + "confidence": 0.983 + }, + { + "text": "got", + "start": 1.94, + "end": 2.1, + "confidence": 0.743 + }, + { + "text": "a", + "start": 2.1, + "end": 2.26, + "confidence": 0.993 + }, + { + "text": "recommendation", + "start": 2.26, + "end": 2.86, + "confidence": 0.977 + }, + { + "text": "for", + "start": 2.86, + "end": 3.44, + "confidence": 0.94 + }, + { + "text": "you", + "start": 3.44, + "end": 3.6, + "confidence": 0.993 + }, + { + "text": "on", + "start": 3.6, + "end": 3.74, + "confidence": 0.918 + }, + { + "text": "your", + "start": 3.74, + "end": 3.94, + "confidence": 0.976 + }, + { + "text": "Soyuz-EA", + "start": 3.94, + "end": 5.26, + "confidence": 0.455 + }, + { + "text": "GLEM-E-G-E-A.", + "start": 5.26, + "end": 6.66, + "confidence": 0.436 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 10.8, + "end": 11.08, + 
"text": " All right.", + "tokens": [ + 50714, + 1057, + 558, + 13, + 50914 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.14, + "words": [ + { + "text": "All", + "start": 10.8, + "end": 10.82, + "confidence": 0.005 + }, + { + "text": "right.", + "start": 10.82, + "end": 11.08, + "confidence": 0.747 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 12.2, + "end": 12.22, + "text": " Okay.", + "tokens": [ + 50914, + 1033, + 13, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.287, + "words": [ + { + "text": "Okay.", + "start": 12.2, + "end": 12.22, + "confidence": 0.287 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 12.22, + "end": 13.38, + "text": " Yeah, sir.", + "tokens": [ + 50964, + 865, + 11, + 4735, + 13, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.124, + "words": [ + { + "text": "Yeah,", + "start": 12.22, + "end": 12.64, + "confidence": 0.113 + }, + { + "text": "sir.", + "start": 12.76, + "end": 13.38, + "confidence": 0.137 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.38, + "end": 13.92, + "text": " Yeah, sir.", + "tokens": [ + 51014, + 865, + 11, + 4735, + 13, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.048, + "words": [ + { + "text": "Yeah,", + "start": 13.38, + "end": 13.48, + "confidence": 0.089 + }, + { + "text": "sir.", + "start": 13.64, + "end": 13.92, + "confidence": 0.026 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 13.92, + "end": 14.52, + "text": " Let's take that camera.", + "tokens": [ + 51064, + 961, + 311, + 747, + 300, + 
2799, + 13, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.054, + "words": [ + { + "text": "Let's", + "start": 13.92, + "end": 14.04, + "confidence": 0.035 + }, + { + "text": "take", + "start": 14.04, + "end": 14.14, + "confidence": 0.027 + }, + { + "text": "that", + "start": 14.14, + "end": 14.22, + "confidence": 0.037 + }, + { + "text": "camera.", + "start": 14.22, + "end": 14.52, + "confidence": 0.14 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 14.52, + "end": 19.08, + "text": " Let's say it makes it want to go on the helmet we were going to have in B-1.", + "tokens": [ + 51114, + 961, + 311, + 584, + 309, + 1669, + 309, + 528, + 281, + 352, + 322, + 264, + 15922, + 321, + 645, + 516, + 281, + 362, + 294, + 363, + 12, + 16, + 13, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.29, + "words": [ + { + "text": "Let's", + "start": 14.52, + "end": 14.82, + "confidence": 0.124 + }, + { + "text": "say", + "start": 14.82, + "end": 14.98, + "confidence": 0.29 + }, + { + "text": "it", + "start": 14.98, + "end": 15.04, + "confidence": 0.029 + }, + { + "text": "makes", + "start": 15.04, + "end": 15.64, + "confidence": 0.633 + }, + { + "text": "it", + "start": 15.64, + "end": 15.86, + "confidence": 0.948 + }, + { + "text": "want", + "start": 15.86, + "end": 16.08, + "confidence": 0.249 + }, + { + "text": "to", + "start": 16.08, + "end": 16.18, + "confidence": 0.969 + }, + { + "text": "go", + "start": 16.18, + "end": 16.38, + "confidence": 0.816 + }, + { + "text": "on", + "start": 16.38, + "end": 16.6, + "confidence": 0.935 + }, + { + "text": "the", + "start": 16.6, + "end": 16.76, + "confidence": 0.449 + }, + { + "text": "helmet", + "start": 16.76, + "end": 17.24, + "confidence": 0.003 + }, + { + "text": "we", + 
"start": 17.24, + "end": 17.54, + "confidence": 0.019 + }, + { + "text": "were", + "start": 17.54, + "end": 17.78, + "confidence": 0.181 + }, + { + "text": "going", + "start": 17.78, + "end": 17.96, + "confidence": 0.637 + }, + { + "text": "to", + "start": 17.96, + "end": 18.12, + "confidence": 0.965 + }, + { + "text": "have", + "start": 18.12, + "end": 18.18, + "confidence": 0.967 + }, + { + "text": "in", + "start": 18.18, + "end": 18.36, + "confidence": 0.902 + }, + { + "text": "B-1.", + "start": 18.36, + "end": 19.08, + "confidence": 0.471 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 19.08, + "end": 19.84, + "text": " The other one.", + "tokens": [ + 51314, + 440, + 661, + 472, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.126, + "words": [ + { + "text": "The", + "start": 19.08, + "end": 19.38, + "confidence": 0.004 + }, + { + "text": "other", + "start": 19.38, + "end": 19.62, + "confidence": 0.141 + }, + { + "text": "one.", + "start": 19.62, + "end": 19.84, + "confidence": 0.691 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 20.04, + "end": 22.8, + "text": " And you can put the other one on the mic helmet.", + "tokens": [ + 51364, + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 13, + 51514 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.405, + "words": [ + { + "text": "And", + "start": 20.04, + "end": 20.22, + "confidence": 0.344 + }, + { + "text": "you", + "start": 20.22, + "end": 20.32, + "confidence": 0.892 + }, + { + "text": "can", + "start": 20.32, + "end": 20.48, + "confidence": 0.126 + }, + { + "text": "put", + "start": 20.48, + "end": 20.64, + "confidence": 0.894 + }, + { + "text": "the", + "start": 20.64, + "end": 20.84, + "confidence": 0.979 + }, + { + 
"text": "other", + "start": 20.84, + "end": 21.0, + "confidence": 0.996 + }, + { + "text": "one", + "start": 21.0, + "end": 21.18, + "confidence": 0.972 + }, + { + "text": "on", + "start": 21.18, + "end": 21.38, + "confidence": 0.969 + }, + { + "text": "the", + "start": 21.38, + "end": 21.66, + "confidence": 0.09 + }, + { + "text": "mic", + "start": 21.66, + "end": 22.48, + "confidence": 0.616 + }, + { + "text": "helmet.", + "start": 22.48, + "end": 22.8, + "confidence": 0.105 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 22.8, + "end": 24.36, + "text": " We'll show it to you in a quick screen.", + "tokens": [ + 51514, + 492, + 603, + 855, + 309, + 281, + 291, + 294, + 257, + 1702, + 2568, + 13, + 51614 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.121, + "words": [ + { + "text": "We'll", + "start": 22.8, + "end": 23.02, + "confidence": 0.08 + }, + { + "text": "show", + "start": 23.02, + "end": 23.24, + "confidence": 0.013 + }, + { + "text": "it", + "start": 23.24, + "end": 23.36, + "confidence": 0.12 + }, + { + "text": "to", + "start": 23.36, + "end": 23.52, + "confidence": 0.356 + }, + { + "text": "you", + "start": 23.52, + "end": 23.64, + "confidence": 0.609 + }, + { + "text": "in", + "start": 23.64, + "end": 23.86, + "confidence": 0.287 + }, + { + "text": "a", + "start": 23.86, + "end": 23.88, + "confidence": 0.723 + }, + { + "text": "quick", + "start": 23.88, + "end": 24.04, + "confidence": 0.016 + }, + { + "text": "screen.", + "start": 24.04, + "end": 24.36, + "confidence": 0.109 + } + ] + }, + { + "id": 10, + "seek": 0, + "start": 24.84, + "end": 25.1, + "text": " Over.", + "tokens": [ + 51614, + 4886, + 13, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.5319976806640625, + "compression_ratio": 1.4690265486725664, + "no_speech_prob": 0.44995221495628357, + "confidence": 0.062, + "words": [ + { + "text": "Over.", + "start": 
24.84, + "end": 25.1, + "confidence": 0.062 + } + ] + }, + { + "id": 11, + "seek": 2600, + "start": 31.32, + "end": 31.36, + "text": " All right.", + "tokens": [ + 50364, + 1057, + 558, + 13, + 50614 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.108, + "words": [ + { + "text": "All", + "start": 31.32, + "end": 31.34, + "confidence": 0.003 + }, + { + "text": "right.", + "start": 31.34, + "end": 31.36, + "confidence": 0.677 + } + ] + }, + { + "id": 12, + "seek": 2600, + "start": 31.36, + "end": 32.06, + "text": " Yeah, sir.", + "tokens": [ + 50614, + 865, + 11, + 4735, + 13, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.035, + "words": [ + { + "text": "Yeah,", + "start": 31.36, + "end": 31.56, + "confidence": 0.033 + }, + { + "text": "sir.", + "start": 31.56, + "end": 32.06, + "confidence": 0.036 + } + ] + }, + { + "id": 13, + "seek": 2600, + "start": 32.26, + "end": 33.0, + "text": " All right.", + "tokens": [ + 50664, + 1057, + 558, + 13, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.201, + "words": [ + { + "text": "All", + "start": 32.26, + "end": 32.86, + "confidence": 0.022 + }, + { + "text": "right.", + "start": 32.86, + "end": 33.0, + "confidence": 0.607 + } + ] + }, + { + "id": 14, + "seek": 2600, + "start": 33.0, + "end": 33.5, + "text": " Yeah, sir.", + "tokens": [ + 50714, + 865, + 11, + 4735, + 13, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.044, + "words": [ + { + "text": "Yeah,", + "start": 33.0, + "end": 33.16, + "confidence": 0.208 + }, + { + "text": 
"sir.", + "start": 33.22, + "end": 33.5, + "confidence": 0.009 + } + ] + }, + { + "id": 15, + "seek": 2600, + "start": 33.5, + "end": 34.98, + "text": " There's a better helmet than B-1.", + "tokens": [ + 50764, + 821, + 311, + 257, + 1101, + 15922, + 813, + 363, + 12, + 16, + 13, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.04, + "words": [ + { + "text": "There's", + "start": 33.5, + "end": 33.9, + "confidence": 0.022 + }, + { + "text": "a", + "start": 33.9, + "end": 33.92, + "confidence": 0.264 + }, + { + "text": "better", + "start": 33.92, + "end": 33.94, + "confidence": 0.227 + }, + { + "text": "helmet", + "start": 33.94, + "end": 34.2, + "confidence": 0.004 + }, + { + "text": "than", + "start": 34.2, + "end": 34.6, + "confidence": 0.352 + }, + { + "text": "B-1.", + "start": 34.6, + "end": 34.98, + "confidence": 0.022 + } + ] + }, + { + "id": 16, + "seek": 2600, + "start": 35.0, + "end": 35.8, + "text": " That's the other one.", + "tokens": [ + 50814, + 663, + 311, + 264, + 661, + 472, + 13, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.277, + "words": [ + { + "text": "That's", + "start": 35.0, + "end": 35.38, + "confidence": 0.161 + }, + { + "text": "the", + "start": 35.38, + "end": 35.48, + "confidence": 0.514 + }, + { + "text": "other", + "start": 35.48, + "end": 35.6, + "confidence": 0.965 + }, + { + "text": "one.", + "start": 35.6, + "end": 35.8, + "confidence": 0.189 + } + ] + }, + { + "id": 17, + "seek": 2600, + "start": 35.8, + "end": 36.04, + "text": " Nice.", + "tokens": [ + 50864, + 5490, + 13, + 50914 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.011, + "words": [ + { + 
"text": "Nice.", + "start": 35.8, + "end": 36.04, + "confidence": 0.011 + } + ] + }, + { + "id": 18, + "seek": 2600, + "start": 37.62, + "end": 38.38, + "text": " Let's go in there.", + "tokens": [ + 50914, + 961, + 311, + 352, + 294, + 456, + 13, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.125, + "words": [ + { + "text": "Let's", + "start": 37.62, + "end": 38.1, + "confidence": 0.022 + }, + { + "text": "go", + "start": 38.1, + "end": 38.12, + "confidence": 0.626 + }, + { + "text": "in", + "start": 38.12, + "end": 38.26, + "confidence": 0.037 + }, + { + "text": "there.", + "start": 38.26, + "end": 38.38, + "confidence": 0.579 + } + ] + }, + { + "id": 19, + "seek": 2600, + "start": 38.38, + "end": 39.2, + "text": " At least we're safe.", + "tokens": [ + 50964, + 1711, + 1935, + 321, + 434, + 3273, + 13, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.107, + "words": [ + { + "text": "At", + "start": 38.38, + "end": 38.44, + "confidence": 0.003 + }, + { + "text": "least", + "start": 38.44, + "end": 38.72, + "confidence": 0.125 + }, + { + "text": "we're", + "start": 38.72, + "end": 38.98, + "confidence": 0.091 + }, + { + "text": "safe.", + "start": 38.98, + "end": 39.2, + "confidence": 0.715 + } + ] + }, + { + "id": 20, + "seek": 2600, + "start": 39.88, + "end": 40.54, + "text": " We've got them in there.", + "tokens": [ + 51014, + 492, + 600, + 658, + 552, + 294, + 456, + 13, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.077, + "words": [ + { + "text": "We've", + "start": 39.88, + "end": 40.36, + "confidence": 0.055 + }, + { + "text": "got", + "start": 40.36, + "end": 40.48, + 
"confidence": 0.749 + }, + { + "text": "them", + "start": 40.48, + "end": 40.5, + "confidence": 0.003 + }, + { + "text": "in", + "start": 40.5, + "end": 40.52, + "confidence": 0.053 + }, + { + "text": "there.", + "start": 40.52, + "end": 40.54, + "confidence": 0.211 + } + ] + }, + { + "id": 21, + "seek": 2600, + "start": 40.54, + "end": 41.04, + "text": " Helmet bags.", + "tokens": [ + 51064, + 6128, + 5537, + 10405, + 13, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.001, + "words": [ + { + "text": "Helmet", + "start": 40.54, + "end": 40.66, + "confidence": 0.001 + }, + { + "text": "bags.", + "start": 40.66, + "end": 41.04, + "confidence": 0.002 + } + ] + }, + { + "id": 22, + "seek": 2600, + "start": 43.18, + "end": 47.4, + "text": " And, uh, I guess we have helmets in the helmet bag.", + "tokens": [ + 51114, + 400, + 11, + 2232, + 11, + 286, + 2041, + 321, + 362, + 42022, + 294, + 264, + 15922, + 3411, + 13, + 51464 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.175, + "words": [ + { + "text": "And,", + "start": 43.18, + "end": 43.2, + "confidence": 0.052 + }, + { + "text": "uh,", + "start": 43.48, + "end": 43.74, + "confidence": 0.745 + }, + { + "text": "I", + "start": 43.86, + "end": 44.04, + "confidence": 0.341 + }, + { + "text": "guess", + "start": 44.04, + "end": 44.2, + "confidence": 0.283 + }, + { + "text": "we", + "start": 44.2, + "end": 44.52, + "confidence": 0.055 + }, + { + "text": "have", + "start": 44.52, + "end": 45.48, + "confidence": 0.053 + }, + { + "text": "helmets", + "start": 45.48, + "end": 46.5, + "confidence": 0.005 + }, + { + "text": "in", + "start": 46.5, + "end": 46.72, + "confidence": 0.216 + }, + { + "text": "the", + "start": 46.72, + "end": 46.92, + "confidence": 0.619 + }, + { + "text": 
"helmet", + "start": 46.92, + "end": 47.08, + "confidence": 0.831 + }, + { + "text": "bag.", + "start": 47.08, + "end": 47.4, + "confidence": 0.329 + } + ] + }, + { + "id": 23, + "seek": 2600, + "start": 48.2, + "end": 49.52, + "text": " At least it's in the helmet bag.", + "tokens": [ + 51464, + 1711, + 1935, + 309, + 311, + 294, + 264, + 15922, + 3411, + 13, + 51564 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.122, + "words": [ + { + "text": "At", + "start": 48.2, + "end": 48.34, + "confidence": 0.095 + }, + { + "text": "least", + "start": 48.34, + "end": 48.6, + "confidence": 0.76 + }, + { + "text": "it's", + "start": 48.6, + "end": 48.86, + "confidence": 0.339 + }, + { + "text": "in", + "start": 48.86, + "end": 48.96, + "confidence": 0.151 + }, + { + "text": "the", + "start": 48.96, + "end": 49.1, + "confidence": 0.223 + }, + { + "text": "helmet", + "start": 49.1, + "end": 49.18, + "confidence": 0.006 + }, + { + "text": "bag.", + "start": 49.18, + "end": 49.52, + "confidence": 0.06 + } + ] + }, + { + "id": 24, + "seek": 2600, + "start": 49.52, + "end": 50.38, + "text": " Right here.", + "tokens": [ + 51564, + 1779, + 510, + 13, + 51614 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.059, + "words": [ + { + "text": "Right", + "start": 49.52, + "end": 49.62, + "confidence": 0.027 + }, + { + "text": "here.", + "start": 49.62, + "end": 50.38, + "confidence": 0.088 + } + ] + }, + { + "id": 25, + "seek": 2600, + "start": 51.52, + "end": 51.98, + "text": " Right here.", + "tokens": [ + 51614, + 1779, + 510, + 13, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.017, + "words": [ + { + "text": "Right", + 
"start": 51.52, + "end": 51.72, + "confidence": 0.001 + }, + { + "text": "here.", + "start": 51.72, + "end": 51.98, + "confidence": 0.067 + } + ] + }, + { + "id": 26, + "seek": 2600, + "start": 51.98, + "end": 52.74, + "text": " Yeah, we're taking it next day.", + "tokens": [ + 51664, + 865, + 11, + 321, + 434, + 1940, + 309, + 958, + 786, + 13, + 51714 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.047, + "words": [ + { + "text": "Yeah,", + "start": 51.98, + "end": 52.28, + "confidence": 0.043 + }, + { + "text": "we're", + "start": 52.28, + "end": 52.3, + "confidence": 0.288 + }, + { + "text": "taking", + "start": 52.3, + "end": 52.32, + "confidence": 0.005 + }, + { + "text": "it", + "start": 52.32, + "end": 52.34, + "confidence": 0.052 + }, + { + "text": "next", + "start": 52.34, + "end": 52.52, + "confidence": 0.002 + }, + { + "text": "day.", + "start": 52.52, + "end": 52.74, + "confidence": 0.113 + } + ] + }, + { + "id": 27, + "seek": 2600, + "start": 52.74, + "end": 54.1, + "text": " Yeah, we're taking it next day.", + "tokens": [ + 51714, + 865, + 11, + 321, + 434, + 1940, + 309, + 958, + 786, + 13, + 51764 + ], + "temperature": 0.0, + "avg_logprob": -0.5039673957271852, + "compression_ratio": 1.9243243243243244, + "no_speech_prob": 0.08131810277700424, + "confidence": 0.41, + "words": [ + { + "text": "Yeah,", + "start": 52.74, + "end": 53.24, + "confidence": 0.601 + }, + { + "text": "we're", + "start": 53.34, + "end": 53.44, + "confidence": 0.703 + }, + { + "text": "taking", + "start": 53.44, + "end": 53.62, + "confidence": 0.261 + }, + { + "text": "it", + "start": 53.62, + "end": 53.76, + "confidence": 0.247 + }, + { + "text": "next", + "start": 53.76, + "end": 53.88, + "confidence": 0.405 + }, + { + "text": "day.", + "start": 53.88, + "end": 54.1, + "confidence": 0.266 + } + ] + }, + { + "id": 28, + "seek": 5400, + "start": 56.68, + 
"end": 58.34, + "text": " We're gonna hang me on the cover.", + "tokens": [ + 50364, + 492, + 434, + 799, + 3967, + 385, + 322, + 264, + 2060, + 13, + 50614 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.117, + "words": [ + { + "text": "We're", + "start": 56.68, + "end": 56.8, + "confidence": 0.047 + }, + { + "text": "gonna", + "start": 56.8, + "end": 57.12, + "confidence": 0.472 + }, + { + "text": "hang", + "start": 57.12, + "end": 57.36, + "confidence": 0.421 + }, + { + "text": "me", + "start": 57.36, + "end": 57.58, + "confidence": 0.657 + }, + { + "text": "on", + "start": 57.58, + "end": 57.74, + "confidence": 0.88 + }, + { + "text": "the", + "start": 57.74, + "end": 57.88, + "confidence": 0.115 + }, + { + "text": "cover.", + "start": 57.88, + "end": 58.34, + "confidence": 0.012 + } + ] + }, + { + "id": 29, + "seek": 5400, + "start": 61.3, + "end": 61.8, + "text": " I tried it already.", + "tokens": [ + 50614, + 286, + 3031, + 309, + 1217, + 13, + 50764 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.042, + "words": [ + { + "text": "I", + "start": 61.3, + "end": 61.32, + "confidence": 0.095 + }, + { + "text": "tried", + "start": 61.32, + "end": 61.34, + "confidence": 0.0 + }, + { + "text": "it", + "start": 61.34, + "end": 61.44, + "confidence": 0.078 + }, + { + "text": "already.", + "start": 61.44, + "end": 61.8, + "confidence": 0.365 + } + ] + }, + { + "id": 30, + "seek": 5400, + "start": 62.52, + "end": 63.06, + "text": " Okay, fine.", + "tokens": [ + 50764, + 1033, + 11, + 2489, + 13, + 50814 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.482, + "words": [ + { + 
"text": "Okay,", + "start": 62.52, + "end": 62.76, + "confidence": 0.39 + }, + { + "text": "fine.", + "start": 62.88, + "end": 63.06, + "confidence": 0.595 + } + ] + }, + { + "id": 31, + "seek": 5400, + "start": 63.06, + "end": 65.1, + "text": " We weren't sure that, uh, just a suggestion.", + "tokens": [ + 50814, + 492, + 4999, + 380, + 988, + 300, + 11, + 2232, + 11, + 445, + 257, + 16541, + 13, + 50914 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.489, + "words": [ + { + "text": "We", + "start": 63.06, + "end": 63.26, + "confidence": 0.274 + }, + { + "text": "weren't", + "start": 63.26, + "end": 63.58, + "confidence": 0.918 + }, + { + "text": "sure", + "start": 63.58, + "end": 63.72, + "confidence": 0.976 + }, + { + "text": "that,", + "start": 63.72, + "end": 63.98, + "confidence": 0.293 + }, + { + "text": "uh,", + "start": 64.08, + "end": 64.32, + "confidence": 0.628 + }, + { + "text": "just", + "start": 64.34, + "end": 64.6, + "confidence": 0.34 + }, + { + "text": "a", + "start": 64.6, + "end": 64.76, + "confidence": 0.297 + }, + { + "text": "suggestion.", + "start": 64.76, + "end": 65.1, + "confidence": 0.493 + } + ] + }, + { + "id": 32, + "seek": 5400, + "start": 65.1, + "end": 67.5, + "text": " We thought we'd, uh, that you could check it out.", + "tokens": [ + 50914, + 492, + 1194, + 321, + 1116, + 11, + 2232, + 11, + 300, + 291, + 727, + 1520, + 309, + 484, + 13, + 51014 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.36, + "words": [ + { + "text": "We", + "start": 65.1, + "end": 65.3, + "confidence": 0.11 + }, + { + "text": "thought", + "start": 65.3, + "end": 65.54, + "confidence": 0.863 + }, + { + "text": "we'd,", + "start": 65.54, + "end": 65.84, + "confidence": 0.408 + }, + { + "text": 
"uh,", + "start": 65.9, + "end": 66.02, + "confidence": 0.641 + }, + { + "text": "that", + "start": 66.78, + "end": 66.92, + "confidence": 0.043 + }, + { + "text": "you", + "start": 66.92, + "end": 67.08, + "confidence": 0.967 + }, + { + "text": "could", + "start": 67.08, + "end": 67.24, + "confidence": 0.851 + }, + { + "text": "check", + "start": 67.24, + "end": 67.4, + "confidence": 0.13 + }, + { + "text": "it", + "start": 67.4, + "end": 67.48, + "confidence": 0.176 + }, + { + "text": "out.", + "start": 67.48, + "end": 67.5, + "confidence": 0.53 + } + ] + }, + { + "id": 33, + "seek": 5400, + "start": 68.18, + "end": 69.08, + "text": " It's not much of an order, sir.", + "tokens": [ + 51014, + 467, + 311, + 406, + 709, + 295, + 364, + 1668, + 11, + 4735, + 13, + 51114 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.173, + "words": [ + { + "text": "It's", + "start": 68.18, + "end": 68.22, + "confidence": 0.069 + }, + { + "text": "not", + "start": 68.22, + "end": 68.38, + "confidence": 0.17 + }, + { + "text": "much", + "start": 68.38, + "end": 68.54, + "confidence": 0.29 + }, + { + "text": "of", + "start": 68.54, + "end": 68.68, + "confidence": 0.474 + }, + { + "text": "an", + "start": 68.68, + "end": 68.84, + "confidence": 0.246 + }, + { + "text": "order,", + "start": 68.84, + "end": 68.88, + "confidence": 0.317 + }, + { + "text": "sir.", + "start": 69.02, + "end": 69.08, + "confidence": 0.094 + } + ] + }, + { + "id": 34, + "seek": 5400, + "start": 69.08, + "end": 71.92, + "text": " And so, uh, I guess we're gonna come up with this.", + "tokens": [ + 51114, + 400, + 370, + 11, + 2232, + 11, + 286, + 2041, + 321, + 434, + 799, + 808, + 493, + 365, + 341, + 13, + 51264 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + 
"confidence": 0.393, + "words": [ + { + "text": "And", + "start": 69.08, + "end": 69.24, + "confidence": 0.078 + }, + { + "text": "so,", + "start": 69.24, + "end": 69.6, + "confidence": 0.546 + }, + { + "text": "uh,", + "start": 69.72, + "end": 69.84, + "confidence": 0.387 + }, + { + "text": "I", + "start": 70.36, + "end": 70.5, + "confidence": 0.938 + }, + { + "text": "guess", + "start": 70.5, + "end": 70.66, + "confidence": 0.976 + }, + { + "text": "we're", + "start": 70.66, + "end": 71.08, + "confidence": 0.4 + }, + { + "text": "gonna", + "start": 71.08, + "end": 71.26, + "confidence": 0.375 + }, + { + "text": "come", + "start": 71.26, + "end": 71.42, + "confidence": 0.171 + }, + { + "text": "up", + "start": 71.42, + "end": 71.62, + "confidence": 0.79 + }, + { + "text": "with", + "start": 71.62, + "end": 71.78, + "confidence": 0.86 + }, + { + "text": "this.", + "start": 71.78, + "end": 71.92, + "confidence": 0.192 + } + ] + }, + { + "id": 35, + "seek": 5400, + "start": 71.92, + "end": 72.46, + "text": " Let us know.", + "tokens": [ + 51264, + 961, + 505, + 458, + 13, + 51314 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.405, + "words": [ + { + "text": "Let", + "start": 71.92, + "end": 72.08, + "confidence": 0.09 + }, + { + "text": "us", + "start": 72.08, + "end": 72.24, + "confidence": 0.457 + }, + { + "text": "know.", + "start": 72.24, + "end": 72.46, + "confidence": 0.809 + } + ] + }, + { + "id": 36, + "seek": 5400, + "start": 74.16, + "end": 74.18, + "text": " Okay.", + "tokens": [ + 51314, + 1033, + 13, + 51364 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.024, + "words": [ + { + "text": "Okay.", + "start": 74.16, + "end": 74.18, + "confidence": 0.024 + } + ] + }, + { + "id": 37, + "seek": 
5400, + "start": 74.18, + "end": 75.06, + "text": " No problem.", + "tokens": [ + 51364, + 883, + 1154, + 13, + 51414 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.041, + "words": [ + { + "text": "No", + "start": 74.18, + "end": 74.4, + "confidence": 0.004 + }, + { + "text": "problem.", + "start": 74.4, + "end": 75.06, + "confidence": 0.124 + } + ] + }, + { + "id": 38, + "seek": 5400, + "start": 75.2, + "end": 75.82, + "text": " Okay.", + "tokens": [ + 51414, + 1033, + 13, + 51464 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.236, + "words": [ + { + "text": "Okay.", + "start": 75.2, + "end": 75.82, + "confidence": 0.236 + } + ] + }, + { + "id": 39, + "seek": 5400, + "start": 75.82, + "end": 76.52, + "text": " No problem.", + "tokens": [ + 51464, + 883, + 1154, + 13, + 51514 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.456, + "words": [ + { + "text": "No", + "start": 75.82, + "end": 76.16, + "confidence": 0.216 + }, + { + "text": "problem.", + "start": 76.16, + "end": 76.52, + "confidence": 0.663 + } + ] + }, + { + "id": 40, + "seek": 5400, + "start": 78.48, + "end": 78.52, + "text": " No problem.", + "tokens": [ + 51514, + 883, + 1154, + 13, + 51564 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.021, + "words": [ + { + "text": "No", + "start": 78.48, + "end": 78.5, + "confidence": 0.016 + }, + { + "text": "problem.", + "start": 78.5, + "end": 78.52, + "confidence": 0.024 + } + ] + }, + { + "id": 41, + "seek": 5400, + "start": 
78.52, + "end": 79.3, + "text": " No worry.", + "tokens": [ + 51564, + 883, + 3292, + 13, + 51614 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.003, + "words": [ + { + "text": "No", + "start": 78.52, + "end": 78.7, + "confidence": 0.001 + }, + { + "text": "worry.", + "start": 78.7, + "end": 79.3, + "confidence": 0.005 + } + ] + }, + { + "id": 42, + "seek": 5400, + "start": 79.3, + "end": 80.04, + "text": " None.", + "tokens": [ + 51614, + 14492, + 13, + 51664 + ], + "temperature": 0.6000000000000001, + "avg_logprob": -0.46983818116226816, + "compression_ratio": 1.5763546798029557, + "no_speech_prob": 0.2010825127363205, + "confidence": 0.002, + "words": [ + { + "text": "None.", + "start": 79.3, + "end": 80.04, + "confidence": 0.002 + } + ] + }, + { + "id": 43, + "seek": 8000, + "start": 88.8, + "end": 88.98, + "text": " Thank you.", + "tokens": [ + 50364, + 1044, + 291, + 13, + 50818 + ], + "temperature": 0.0, + "avg_logprob": -0.9733104705810547, + "compression_ratio": 0.5555555555555556, + "no_speech_prob": 0.4526429772377014, + "confidence": 0.261, + "words": [ + { + "text": "Thank", + "start": 88.8, + "end": 88.92, + "confidence": 0.026 + }, + { + "text": "you.", + "start": 88.92, + "end": 88.98, + "confidence": 0.83 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/naive/naive_apollo11.mp3.words.json b/tests/expected/naive/naive_apollo11.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..97affdfce771a65f33d19d1dce35134b2c1677a1 --- /dev/null +++ b/tests/expected/naive/naive_apollo11.mp3.words.json @@ -0,0 +1,3820 @@ +{ + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA. Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1. 
And you can put the other one on the mic helmet with those GVA blizzard frames. Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, 
got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.54, + "end": 6.56, + "text": " Apollo 11, Houston we got a recommendation for you on your Soyuz-VA GLEME GVA.", + "tokens": [ + 50364, + 25187, + 2975, + 11, + 18717, + 321, + 658, + 257, + 11879, + 337, + 291, + 322, + 428, + 24758, + 3334, + 12, + 20914, + 460, + 2634, + 15454, + 460, + 20914, + 13, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.7225757398103413, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.494, + "words": [ + { + "text": "Apollo", + "start": 0.54, + "end": 0.92, + "confidence": 0.425 + }, + { + "text": "11,", + "start": 0.92, + "end": 1.26, + "confidence": 0.842 + }, + { + "text": "Houston", + "start": 1.52, + "end": 1.72, + "confidence": 0.974 + }, + { + "text": "we", + "start": 1.72, + "end": 1.92, + "confidence": 0.453 + }, + { + "text": "got", + "start": 1.92, + "end": 2.1, + "confidence": 0.791 + }, + { + "text": "a", + "start": 2.1, + "end": 2.26, + "confidence": 0.992 + }, + { + "text": "recommendation", + "start": 2.26, + "end": 2.86, + "confidence": 0.97 + }, + { + "text": "for", + "start": 2.86, + "end": 3.44, + "confidence": 0.945 + }, + { + "text": "you", + "start": 3.44, + "end": 3.6, + "confidence": 0.99 + }, + { + "text": "on", + "start": 3.6, + "end": 3.72, + "confidence": 0.935 + }, + { + "text": "your", + "start": 3.72, + "end": 3.92, + "confidence": 0.974 + }, + { + "text": "Soyuz-VA", + "start": 3.92, + "end": 5.16, + "confidence": 0.327 + }, + { + "text": "GLEME", + "start": 5.16, + "end": 5.72, + "confidence": 0.178 + }, + { + "text": "GVA.", + "start": 5.72, + "end": 6.56, + "confidence": 0.321 + } + 
] + }, + { + "id": 1, + "seek": 0, + "start": 10.8, + "end": 19.08, + "text": " Alright, okay, we like to say that they make the one that's on the helmet we're going to have in B1.", + "tokens": [ + 50714, + 2798, + 11, + 1392, + 11, + 321, + 411, + 281, + 584, + 300, + 436, + 652, + 264, + 472, + 300, + 311, + 322, + 264, + 15922, + 321, + 434, + 516, + 281, + 362, + 294, + 363, + 16, + 13, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.7225757398103413, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.311, + "words": [ + { + "text": "Alright,", + "start": 10.8, + "end": 10.82, + "confidence": 0.055 + }, + { + "text": "okay,", + "start": 11.46, + "end": 12.2, + "confidence": 0.359 + }, + { + "text": "we", + "start": 12.44, + "end": 12.96, + "confidence": 0.347 + }, + { + "text": "like", + "start": 12.96, + "end": 13.28, + "confidence": 0.512 + }, + { + "text": "to", + "start": 13.28, + "end": 13.6, + "confidence": 0.156 + }, + { + "text": "say", + "start": 13.6, + "end": 14.9, + "confidence": 0.086 + }, + { + "text": "that", + "start": 14.9, + "end": 15.32, + "confidence": 0.273 + }, + { + "text": "they", + "start": 15.32, + "end": 15.46, + "confidence": 0.358 + }, + { + "text": "make", + "start": 15.46, + "end": 15.7, + "confidence": 0.127 + }, + { + "text": "the", + "start": 15.7, + "end": 15.86, + "confidence": 0.165 + }, + { + "text": "one", + "start": 15.86, + "end": 16.08, + "confidence": 0.428 + }, + { + "text": "that's", + "start": 16.08, + "end": 16.26, + "confidence": 0.357 + }, + { + "text": "on", + "start": 16.26, + "end": 16.46, + "confidence": 0.314 + }, + { + "text": "the", + "start": 16.46, + "end": 16.76, + "confidence": 0.498 + }, + { + "text": "helmet", + "start": 16.76, + "end": 17.26, + "confidence": 0.306 + }, + { + "text": "we're", + "start": 17.26, + "end": 17.78, + "confidence": 0.256 + }, + { + "text": "going", + "start": 17.78, + "end": 17.94, + "confidence": 0.478 + }, + { + 
"text": "to", + "start": 17.94, + "end": 18.1, + "confidence": 0.522 + }, + { + "text": "have", + "start": 18.1, + "end": 18.18, + "confidence": 0.804 + }, + { + "text": "in", + "start": 18.18, + "end": 18.36, + "confidence": 0.772 + }, + { + "text": "B1.", + "start": 18.36, + "end": 19.08, + "confidence": 0.738 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 19.08, + "end": 24.54, + "text": " And you can put the other one on the mic helmet with those GVA blizzard frames.", + "tokens": [ + 51314, + 400, + 291, + 393, + 829, + 264, + 661, + 472, + 322, + 264, + 3123, + 15922, + 365, + 729, + 460, + 20914, + 888, + 31062, + 12083, + 13, + 51614 + ], + "temperature": 0.0, + "avg_logprob": -0.7225757398103413, + "compression_ratio": 1.39247311827957, + "no_speech_prob": 0.44998496770858765, + "confidence": 0.129, + "words": [ + { + "text": "And", + "start": 19.08, + "end": 20.14, + "confidence": 0.232 + }, + { + "text": "you", + "start": 20.14, + "end": 20.32, + "confidence": 0.905 + }, + { + "text": "can", + "start": 20.32, + "end": 20.5, + "confidence": 0.422 + }, + { + "text": "put", + "start": 20.5, + "end": 20.64, + "confidence": 0.942 + }, + { + "text": "the", + "start": 20.64, + "end": 20.82, + "confidence": 0.983 + }, + { + "text": "other", + "start": 20.82, + "end": 21.0, + "confidence": 0.994 + }, + { + "text": "one", + "start": 21.0, + "end": 21.18, + "confidence": 0.965 + }, + { + "text": "on", + "start": 21.18, + "end": 21.36, + "confidence": 0.965 + }, + { + "text": "the", + "start": 21.36, + "end": 21.78, + "confidence": 0.187 + }, + { + "text": "mic", + "start": 21.78, + "end": 22.48, + "confidence": 0.586 + }, + { + "text": "helmet", + "start": 22.48, + "end": 22.82, + "confidence": 0.029 + }, + { + "text": "with", + "start": 22.82, + "end": 23.06, + "confidence": 0.047 + }, + { + "text": "those", + "start": 23.06, + "end": 23.3, + "confidence": 0.036 + }, + { + "text": "GVA", + "start": 23.3, + "end": 23.74, + "confidence": 0.001 + }, + { + 
"text": "blizzard", + "start": 23.74, + "end": 24.18, + "confidence": 0.022 + }, + { + "text": "frames.", + "start": 24.18, + "end": 24.54, + "confidence": 0.225 + } + ] + }, + { + "id": 3, + "seek": 2500, + "start": 31.34, + "end": 54.52, + "text": " Alright, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 2798, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, 
+ 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.11148937649197048, + "compression_ratio": 24.096774193548388, + "no_speech_prob": 0.4302051365375519, + "confidence": 0.885, + "words": [ + { + "text": "Alright,", + "start": 31.34, + "end": 31.52, + "confidence": 0.069 + }, + { + "text": "got", + "start": 31.82, + "end": 31.86, + "confidence": 0.144 + }, + { + "text": "them,", + "start": 31.86, + "end": 32.1, + "confidence": 0.194 + }, + { + "text": "got", + "start": 32.38, + "end": 32.88, + "confidence": 0.473 + }, + { + "text": "them,", + "start": 32.88, + "end": 33.48, + "confidence": 0.611 + }, + { + "text": "got", + "start": 33.5, + "end": 33.52, + "confidence": 0.574 + }, + { + "text": "them,", + "start": 33.52, + "end": 33.54, + "confidence": 0.51 + }, + { + "text": "got", + "start": 33.76, + "end": 33.78, + "confidence": 0.599 + }, + { + "text": "them,", + "start": 33.78, + "end": 33.88, + "confidence": 0.488 + }, + { + "text": "got", + "start": 34.12, + "end": 34.14, + "confidence": 0.724 + }, + { + "text": "them,", + "start": 34.14, + "end": 34.16, + "confidence": 0.567 + }, + { + "text": "got", + "start": 34.16, + "end": 34.18, + "confidence": 0.761 + }, + { + "text": "them,", + "start": 34.18, + "end": 34.34, + "confidence": 0.689 + }, + { + "text": "got", + "start": 34.34, + "end": 34.36, + "confidence": 0.851 + }, + { + "text": "them,", + "start": 34.36, + "end": 34.5, + "confidence": 0.813 + }, + { + "text": "got", + "start": 34.5, + "end": 34.64, + 
"confidence": 0.916 + }, + { + "text": "them,", + "start": 34.64, + "end": 34.66, + "confidence": 0.756 + }, + { + "text": "got", + "start": 34.82, + "end": 34.92, + "confidence": 0.467 + }, + { + "text": "them,", + "start": 34.92, + "end": 35.0, + "confidence": 0.851 + }, + { + "text": "got", + "start": 35.0, + "end": 35.02, + "confidence": 0.917 + }, + { + "text": "them,", + "start": 35.02, + "end": 35.1, + "confidence": 0.897 + }, + { + "text": "got", + "start": 35.1, + "end": 35.28, + "confidence": 0.923 + }, + { + "text": "them,", + "start": 35.28, + "end": 35.64, + "confidence": 0.911 + }, + { + "text": "got", + "start": 35.66, + "end": 35.68, + "confidence": 0.923 + }, + { + "text": "them,", + "start": 35.68, + "end": 35.7, + "confidence": 0.917 + }, + { + "text": "got", + "start": 35.74, + "end": 35.76, + "confidence": 0.935 + }, + { + "text": "them,", + "start": 35.76, + "end": 35.78, + "confidence": 0.915 + }, + { + "text": "got", + "start": 36.04, + "end": 36.36, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 36.36, + "end": 36.68, + "confidence": 0.91 + }, + { + "text": "got", + "start": 36.68, + "end": 36.7, + "confidence": 0.934 + }, + { + "text": "them,", + "start": 36.7, + "end": 36.72, + "confidence": 0.916 + }, + { + "text": "got", + "start": 36.72, + "end": 36.74, + "confidence": 0.926 + }, + { + "text": "them,", + "start": 36.74, + "end": 36.76, + "confidence": 0.92 + }, + { + "text": "got", + "start": 36.76, + "end": 36.78, + "confidence": 0.926 + }, + { + "text": "them,", + "start": 36.78, + "end": 36.8, + "confidence": 0.924 + }, + { + "text": "got", + "start": 36.8, + "end": 36.82, + "confidence": 0.932 + }, + { + "text": "them,", + "start": 36.82, + "end": 36.84, + "confidence": 0.93 + }, + { + "text": "got", + "start": 36.84, + "end": 36.86, + "confidence": 0.935 + }, + { + "text": "them,", + "start": 36.86, + "end": 36.88, + "confidence": 0.937 + }, + { + "text": "got", + "start": 36.88, + "end": 37.46, + "confidence": 0.941 
+ }, + { + "text": "them,", + "start": 37.46, + "end": 37.82, + "confidence": 0.942 + }, + { + "text": "got", + "start": 37.82, + "end": 37.84, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 37.84, + "end": 38.12, + "confidence": 0.945 + }, + { + "text": "got", + "start": 38.12, + "end": 38.14, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 38.14, + "end": 38.16, + "confidence": 0.948 + }, + { + "text": "got", + "start": 38.16, + "end": 38.18, + "confidence": 0.948 + }, + { + "text": "them,", + "start": 38.18, + "end": 38.2, + "confidence": 0.951 + }, + { + "text": "got", + "start": 38.2, + "end": 38.22, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 38.22, + "end": 38.54, + "confidence": 0.953 + }, + { + "text": "got", + "start": 38.54, + "end": 38.56, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 38.56, + "end": 38.58, + "confidence": 0.956 + }, + { + "text": "got", + "start": 38.58, + "end": 38.6, + "confidence": 0.952 + }, + { + "text": "them,", + "start": 38.6, + "end": 38.62, + "confidence": 0.956 + }, + { + "text": "got", + "start": 38.62, + "end": 38.64, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 38.64, + "end": 38.66, + "confidence": 0.958 + }, + { + "text": "got", + "start": 38.66, + "end": 38.68, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 38.68, + "end": 38.7, + "confidence": 0.961 + }, + { + "text": "got", + "start": 38.7, + "end": 38.72, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 38.72, + "end": 38.74, + "confidence": 0.961 + }, + { + "text": "got", + "start": 38.74, + "end": 38.76, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 38.76, + "end": 38.78, + "confidence": 0.962 + }, + { + "text": "got", + "start": 38.78, + "end": 38.8, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 38.8, + "end": 38.82, + "confidence": 0.964 + }, + { + "text": "got", + "start": 38.82, + "end": 38.84, + "confidence": 0.958 + }, + { + 
"text": "them,", + "start": 38.84, + "end": 38.86, + "confidence": 0.964 + }, + { + "text": "got", + "start": 38.86, + "end": 38.88, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 38.88, + "end": 38.9, + "confidence": 0.965 + }, + { + "text": "got", + "start": 38.9, + "end": 38.92, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 38.92, + "end": 38.94, + "confidence": 0.968 + }, + { + "text": "got", + "start": 38.94, + "end": 38.96, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 38.96, + "end": 38.98, + "confidence": 0.969 + }, + { + "text": "got", + "start": 38.98, + "end": 39.0, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 39.0, + "end": 39.02, + "confidence": 0.968 + }, + { + "text": "got", + "start": 39.02, + "end": 39.04, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 39.04, + "end": 39.06, + "confidence": 0.971 + }, + { + "text": "got", + "start": 39.06, + "end": 39.08, + "confidence": 0.967 + }, + { + "text": "them,", + "start": 39.08, + "end": 39.1, + "confidence": 0.971 + }, + { + "text": "got", + "start": 39.1, + "end": 39.12, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 39.12, + "end": 39.14, + "confidence": 0.974 + }, + { + "text": "got", + "start": 39.14, + "end": 39.16, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 39.16, + "end": 39.18, + "confidence": 0.974 + }, + { + "text": "got", + "start": 39.18, + "end": 39.2, + "confidence": 0.972 + }, + { + "text": "them,", + "start": 39.2, + "end": 39.22, + "confidence": 0.975 + }, + { + "text": "got", + "start": 39.22, + "end": 39.24, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 39.24, + "end": 39.26, + "confidence": 0.976 + }, + { + "text": "got", + "start": 39.26, + "end": 39.28, + "confidence": 0.977 + }, + { + "text": "them,", + "start": 39.28, + "end": 39.3, + "confidence": 0.978 + }, + { + "text": "got", + "start": 39.3, + "end": 39.32, + "confidence": 0.978 + }, + { + "text": "them,", + 
"start": 39.32, + "end": 39.34, + "confidence": 0.979 + }, + { + "text": "got", + "start": 39.34, + "end": 39.36, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 39.36, + "end": 39.38, + "confidence": 0.979 + }, + { + "text": "got", + "start": 39.38, + "end": 39.4, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 39.4, + "end": 39.42, + "confidence": 0.98 + }, + { + "text": "got", + "start": 39.42, + "end": 39.44, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 39.44, + "end": 39.46, + "confidence": 0.981 + }, + { + "text": "got", + "start": 39.46, + "end": 39.48, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 39.48, + "end": 39.5, + "confidence": 0.982 + }, + { + "text": "got", + "start": 39.5, + "end": 39.52, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 39.52, + "end": 39.54, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.54, + "end": 39.56, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 39.56, + "end": 39.58, + "confidence": 0.984 + }, + { + "text": "got", + "start": 39.58, + "end": 39.6, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 39.6, + "end": 39.62, + "confidence": 0.983 + }, + { + "text": "got", + "start": 39.62, + "end": 39.64, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.64, + "end": 39.66, + "confidence": 0.984 + }, + { + "text": "got", + "start": 39.66, + "end": 39.68, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 39.68, + "end": 39.7, + "confidence": 0.985 + }, + { + "text": "got", + "start": 39.7, + "end": 39.72, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.72, + "end": 39.74, + "confidence": 0.986 + }, + { + "text": "got", + "start": 39.74, + "end": 39.76, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 39.76, + "end": 39.78, + "confidence": 0.986 + }, + { + "text": "got", + "start": 39.78, + "end": 39.8, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 39.8, + 
"end": 39.82, + "confidence": 0.986 + }, + { + "text": "got", + "start": 39.82, + "end": 39.84, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 39.84, + "end": 39.86, + "confidence": 0.986 + }, + { + "text": "got", + "start": 39.86, + "end": 39.88, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 39.88, + "end": 39.9, + "confidence": 0.987 + }, + { + "text": "got", + "start": 39.9, + "end": 39.92, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 39.92, + "end": 39.94, + "confidence": 0.987 + }, + { + "text": "got", + "start": 39.94, + "end": 39.96, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 39.96, + "end": 39.98, + "confidence": 0.988 + }, + { + "text": "got", + "start": 39.98, + "end": 40.0, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.0, + "end": 40.02, + "confidence": 0.988 + }, + { + "text": "got", + "start": 40.02, + "end": 40.42, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 40.42, + "end": 40.68, + "confidence": 0.988 + }, + { + "text": "got", + "start": 41.04, + "end": 41.06, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 41.06, + "end": 41.54, + "confidence": 0.988 + }, + { + "text": "got", + "start": 41.88, + "end": 41.9, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 41.9, + "end": 42.48, + "confidence": 0.987 + }, + { + "text": "got", + "start": 42.68, + "end": 42.7, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 42.7, + "end": 43.0, + "confidence": 0.989 + }, + { + "text": "got", + "start": 43.54, + "end": 44.06, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 44.06, + "end": 45.16, + "confidence": 0.989 + }, + { + "text": "got", + "start": 45.16, + "end": 45.46, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 45.46, + "end": 45.8, + "confidence": 0.99 + }, + { + "text": "got", + "start": 45.82, + "end": 46.22, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 46.22, + "end": 46.38, + 
"confidence": 0.989 + }, + { + "text": "got", + "start": 46.6, + "end": 47.0, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 47.0, + "end": 47.76, + "confidence": 0.99 + }, + { + "text": "got", + "start": 48.18, + "end": 48.46, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 48.46, + "end": 48.9, + "confidence": 0.99 + }, + { + "text": "got", + "start": 48.9, + "end": 49.2, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 49.2, + "end": 49.84, + "confidence": 0.99 + }, + { + "text": "got", + "start": 50.36, + "end": 50.38, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 50.38, + "end": 50.76, + "confidence": 0.99 + }, + { + "text": "got", + "start": 51.5, + "end": 51.74, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 51.74, + "end": 52.34, + "confidence": 0.99 + }, + { + "text": "got", + "start": 52.44, + "end": 53.28, + "confidence": 0.994 + }, + { + "text": "them", + "start": 53.28, + "end": 54.52, + "confidence": 0.996 + } + ] + }, + { + "id": 4, + "seek": 5500, + "start": 54.52, + "end": 84.46, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 
658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.05314932168866487, + "compression_ratio": 29.52, + "no_speech_prob": 0.2454655021429062, + "confidence": 0.844, + "words": [ + { + "text": "got", + "start": 54.52, + "end": 54.82, + "confidence": 0.002 + }, + { + "text": "them,", + "start": 54.82, + "end": 54.84, + "confidence": 0.016 + }, + { + "text": "got", + "start": 54.84, + "end": 55.14, + "confidence": 0.039 + }, + { + "text": "them,", + "start": 55.14, + "end": 55.56, + "confidence": 0.421 + }, + { + "text": "got", + "start": 55.56, + "end": 56.58, + "confidence": 0.645 + }, + { + "text": "them,", + "start": 56.58, + "end": 56.6, + "confidence": 0.595 + }, 
+ { + "text": "got", + "start": 56.6, + "end": 57.36, + "confidence": 0.78 + }, + { + "text": "them,", + "start": 57.36, + "end": 57.52, + "confidence": 0.639 + }, + { + "text": "got", + "start": 57.76, + "end": 58.22, + "confidence": 0.846 + }, + { + "text": "them,", + "start": 58.22, + "end": 58.26, + "confidence": 0.668 + }, + { + "text": "got", + "start": 58.74, + "end": 58.78, + "confidence": 0.876 + }, + { + "text": "them,", + "start": 58.78, + "end": 59.46, + "confidence": 0.672 + }, + { + "text": "got", + "start": 59.88, + "end": 59.9, + "confidence": 0.836 + }, + { + "text": "them,", + "start": 59.9, + "end": 60.32, + "confidence": 0.74 + }, + { + "text": "got", + "start": 60.52, + "end": 60.6, + "confidence": 0.884 + }, + { + "text": "them,", + "start": 60.6, + "end": 60.7, + "confidence": 0.814 + }, + { + "text": "got", + "start": 60.8, + "end": 60.98, + "confidence": 0.911 + }, + { + "text": "them,", + "start": 60.98, + "end": 61.78, + "confidence": 0.567 + }, + { + "text": "got", + "start": 61.78, + "end": 61.8, + "confidence": 0.122 + }, + { + "text": "them,", + "start": 61.8, + "end": 61.82, + "confidence": 0.748 + }, + { + "text": "got", + "start": 61.82, + "end": 61.84, + "confidence": 0.75 + }, + { + "text": "them,", + "start": 61.84, + "end": 61.86, + "confidence": 0.818 + }, + { + "text": "got", + "start": 61.86, + "end": 61.88, + "confidence": 0.797 + }, + { + "text": "them,", + "start": 61.88, + "end": 61.9, + "confidence": 0.841 + }, + { + "text": "got", + "start": 61.9, + "end": 61.92, + "confidence": 0.81 + }, + { + "text": "them,", + "start": 61.92, + "end": 61.94, + "confidence": 0.864 + }, + { + "text": "got", + "start": 61.94, + "end": 61.96, + "confidence": 0.846 + }, + { + "text": "them,", + "start": 61.96, + "end": 61.98, + "confidence": 0.893 + }, + { + "text": "got", + "start": 61.98, + "end": 62.0, + "confidence": 0.889 + }, + { + "text": "them,", + "start": 62.0, + "end": 62.02, + "confidence": 0.91 + }, + { + "text": "got", + 
"start": 62.02, + "end": 62.04, + "confidence": 0.896 + }, + { + "text": "them,", + "start": 62.04, + "end": 62.06, + "confidence": 0.912 + }, + { + "text": "got", + "start": 62.06, + "end": 62.08, + "confidence": 0.877 + }, + { + "text": "them,", + "start": 62.08, + "end": 62.1, + "confidence": 0.923 + }, + { + "text": "got", + "start": 62.1, + "end": 62.12, + "confidence": 0.888 + }, + { + "text": "them,", + "start": 62.12, + "end": 62.14, + "confidence": 0.932 + }, + { + "text": "got", + "start": 62.14, + "end": 62.16, + "confidence": 0.896 + }, + { + "text": "them,", + "start": 62.16, + "end": 62.18, + "confidence": 0.94 + }, + { + "text": "got", + "start": 62.5, + "end": 62.72, + "confidence": 0.906 + }, + { + "text": "them,", + "start": 62.72, + "end": 62.74, + "confidence": 0.945 + }, + { + "text": "got", + "start": 62.74, + "end": 62.76, + "confidence": 0.912 + }, + { + "text": "them,", + "start": 62.76, + "end": 62.78, + "confidence": 0.95 + }, + { + "text": "got", + "start": 62.78, + "end": 62.8, + "confidence": 0.917 + }, + { + "text": "them,", + "start": 62.8, + "end": 62.82, + "confidence": 0.954 + }, + { + "text": "got", + "start": 62.82, + "end": 62.84, + "confidence": 0.923 + }, + { + "text": "them,", + "start": 62.84, + "end": 62.86, + "confidence": 0.957 + }, + { + "text": "got", + "start": 62.86, + "end": 62.88, + "confidence": 0.929 + }, + { + "text": "them,", + "start": 62.88, + "end": 62.9, + "confidence": 0.959 + }, + { + "text": "got", + "start": 62.9, + "end": 62.92, + "confidence": 0.933 + }, + { + "text": "them,", + "start": 62.92, + "end": 62.94, + "confidence": 0.962 + }, + { + "text": "got", + "start": 62.94, + "end": 62.96, + "confidence": 0.934 + }, + { + "text": "them,", + "start": 62.96, + "end": 62.98, + "confidence": 0.965 + }, + { + "text": "got", + "start": 62.98, + "end": 63.0, + "confidence": 0.935 + }, + { + "text": "them,", + "start": 63.0, + "end": 63.02, + "confidence": 0.965 + }, + { + "text": "got", + "start": 63.02, + 
"end": 63.04, + "confidence": 0.937 + }, + { + "text": "them,", + "start": 63.04, + "end": 63.06, + "confidence": 0.966 + }, + { + "text": "got", + "start": 63.06, + "end": 63.08, + "confidence": 0.94 + }, + { + "text": "them,", + "start": 63.08, + "end": 63.1, + "confidence": 0.967 + }, + { + "text": "got", + "start": 63.1, + "end": 63.12, + "confidence": 0.94 + }, + { + "text": "them,", + "start": 63.12, + "end": 63.14, + "confidence": 0.969 + }, + { + "text": "got", + "start": 63.14, + "end": 63.16, + "confidence": 0.942 + }, + { + "text": "them,", + "start": 63.16, + "end": 63.18, + "confidence": 0.969 + }, + { + "text": "got", + "start": 63.18, + "end": 63.2, + "confidence": 0.943 + }, + { + "text": "them,", + "start": 63.2, + "end": 63.22, + "confidence": 0.97 + }, + { + "text": "got", + "start": 63.22, + "end": 63.24, + "confidence": 0.944 + }, + { + "text": "them,", + "start": 63.24, + "end": 63.26, + "confidence": 0.971 + }, + { + "text": "got", + "start": 63.26, + "end": 63.28, + "confidence": 0.946 + }, + { + "text": "them,", + "start": 63.28, + "end": 63.3, + "confidence": 0.971 + }, + { + "text": "got", + "start": 63.3, + "end": 63.32, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 63.32, + "end": 63.34, + "confidence": 0.972 + }, + { + "text": "got", + "start": 63.34, + "end": 63.36, + "confidence": 0.949 + }, + { + "text": "them,", + "start": 63.36, + "end": 63.38, + "confidence": 0.971 + }, + { + "text": "got", + "start": 63.38, + "end": 63.4, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 63.4, + "end": 63.42, + "confidence": 0.973 + }, + { + "text": "got", + "start": 63.42, + "end": 63.44, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 63.44, + "end": 63.46, + "confidence": 0.973 + }, + { + "text": "got", + "start": 63.46, + "end": 63.48, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 63.48, + "end": 63.5, + "confidence": 0.974 + }, + { + "text": "got", + "start": 63.5, + "end": 63.52, + 
"confidence": 0.956 + }, + { + "text": "them,", + "start": 63.52, + "end": 63.54, + "confidence": 0.974 + }, + { + "text": "got", + "start": 63.54, + "end": 63.56, + "confidence": 0.957 + }, + { + "text": "them,", + "start": 63.56, + "end": 63.58, + "confidence": 0.975 + }, + { + "text": "got", + "start": 63.58, + "end": 63.6, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 63.6, + "end": 63.62, + "confidence": 0.975 + }, + { + "text": "got", + "start": 63.62, + "end": 63.64, + "confidence": 0.962 + }, + { + "text": "them,", + "start": 63.64, + "end": 63.66, + "confidence": 0.975 + }, + { + "text": "got", + "start": 63.66, + "end": 63.68, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 63.68, + "end": 63.7, + "confidence": 0.976 + }, + { + "text": "got", + "start": 63.7, + "end": 63.72, + "confidence": 0.965 + }, + { + "text": "them,", + "start": 63.72, + "end": 63.74, + "confidence": 0.976 + }, + { + "text": "got", + "start": 63.74, + "end": 63.76, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 63.76, + "end": 63.78, + "confidence": 0.977 + }, + { + "text": "got", + "start": 63.78, + "end": 63.8, + "confidence": 0.97 + }, + { + "text": "them,", + "start": 63.8, + "end": 63.82, + "confidence": 0.977 + }, + { + "text": "got", + "start": 63.82, + "end": 63.84, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 63.84, + "end": 63.86, + "confidence": 0.977 + }, + { + "text": "got", + "start": 63.86, + "end": 63.88, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 63.88, + "end": 63.9, + "confidence": 0.977 + }, + { + "text": "got", + "start": 63.9, + "end": 63.92, + "confidence": 0.975 + }, + { + "text": "them,", + "start": 63.92, + "end": 63.94, + "confidence": 0.979 + }, + { + "text": "got", + "start": 63.94, + "end": 63.96, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 63.96, + "end": 63.98, + "confidence": 0.979 + }, + { + "text": "got", + "start": 63.98, + "end": 64.0, + "confidence": 
0.977 + }, + { + "text": "them,", + "start": 64.0, + "end": 64.02, + "confidence": 0.979 + }, + { + "text": "got", + "start": 64.02, + "end": 64.04, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 64.04, + "end": 64.06, + "confidence": 0.979 + }, + { + "text": "got", + "start": 64.06, + "end": 64.08, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 64.08, + "end": 64.1, + "confidence": 0.979 + }, + { + "text": "got", + "start": 64.1, + "end": 64.12, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 64.12, + "end": 64.4, + "confidence": 0.98 + }, + { + "text": "got", + "start": 64.42, + "end": 64.58, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 64.58, + "end": 64.64, + "confidence": 0.98 + }, + { + "text": "got", + "start": 64.74, + "end": 65.06, + "confidence": 0.982 + }, + { + "text": "them,", + "start": 65.06, + "end": 65.22, + "confidence": 0.98 + }, + { + "text": "got", + "start": 65.22, + "end": 65.98, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 65.98, + "end": 66.26, + "confidence": 0.981 + }, + { + "text": "got", + "start": 66.28, + "end": 67.32, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 67.32, + "end": 67.44, + "confidence": 0.982 + }, + { + "text": "got", + "start": 67.68, + "end": 67.7, + "confidence": 0.984 + }, + { + "text": "them,", + "start": 67.7, + "end": 67.88, + "confidence": 0.981 + }, + { + "text": "got", + "start": 67.92, + "end": 68.8, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 68.8, + "end": 69.12, + "confidence": 0.982 + }, + { + "text": "got", + "start": 69.26, + "end": 69.28, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 69.28, + "end": 69.42, + "confidence": 0.982 + }, + { + "text": "got", + "start": 69.82, + "end": 69.84, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 69.84, + "end": 70.16, + "confidence": 0.982 + }, + { + "text": "got", + "start": 70.16, + "end": 70.52, + "confidence": 0.987 + }, + { + 
"text": "them,", + "start": 70.52, + "end": 71.38, + "confidence": 0.981 + }, + { + "text": "got", + "start": 71.38, + "end": 71.58, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 71.58, + "end": 71.94, + "confidence": 0.982 + }, + { + "text": "got", + "start": 71.94, + "end": 72.12, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 72.12, + "end": 72.76, + "confidence": 0.983 + }, + { + "text": "got", + "start": 72.9, + "end": 73.56, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 73.56, + "end": 74.08, + "confidence": 0.983 + }, + { + "text": "got", + "start": 74.68, + "end": 75.08, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 75.08, + "end": 75.18, + "confidence": 0.984 + }, + { + "text": "got", + "start": 75.2, + "end": 76.42, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 76.42, + "end": 76.6, + "confidence": 0.983 + }, + { + "text": "got", + "start": 76.6, + "end": 76.8, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 76.8, + "end": 77.06, + "confidence": 0.985 + }, + { + "text": "got", + "start": 77.06, + "end": 77.44, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 77.44, + "end": 77.78, + "confidence": 0.984 + }, + { + "text": "got", + "start": 78.22, + "end": 78.24, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 78.24, + "end": 78.44, + "confidence": 0.985 + }, + { + "text": "got", + "start": 79.86, + "end": 79.9, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 79.9, + "end": 82.46, + "confidence": 0.985 + }, + { + "text": "got", + "start": 82.46, + "end": 84.44, + "confidence": 0.992 + }, + { + "text": "them", + "start": 84.44, + "end": 84.46, + "confidence": 0.994 + } + ] + }, + { + "id": 5, + "seek": 8500, + "start": 85.2, + "end": 91.86, + "text": " got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got 
them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them, got them", + "tokens": [ + 50364, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552, + 11, 
+ 658, + 552, + 11, + 658, + 552, + 11, + 658, + 552 + ], + "temperature": 0.0, + "avg_logprob": -0.042715128227199674, + "compression_ratio": 29.52, + "no_speech_prob": 0.6358686685562134, + "confidence": 0.854, + "words": [ + { + "text": "got", + "start": 85.2, + "end": 85.36, + "confidence": 0.0 + }, + { + "text": "them,", + "start": 85.36, + "end": 85.42, + "confidence": 0.024 + }, + { + "text": "got", + "start": 85.68, + "end": 86.68, + "confidence": 0.791 + }, + { + "text": "them,", + "start": 86.68, + "end": 86.82, + "confidence": 0.583 + }, + { + "text": "got", + "start": 87.4, + "end": 87.6, + "confidence": 0.828 + }, + { + "text": "them,", + "start": 87.6, + "end": 88.02, + "confidence": 0.486 + }, + { + "text": "got", + "start": 88.02, + "end": 88.88, + "confidence": 0.881 + }, + { + "text": "them,", + "start": 88.88, + "end": 88.9, + "confidence": 0.425 + }, + { + "text": "got", + "start": 88.92, + "end": 88.94, + "confidence": 0.902 + }, + { + "text": "them,", + "start": 88.94, + "end": 88.96, + "confidence": 0.397 + }, + { + "text": "got", + "start": 88.96, + "end": 88.98, + "confidence": 0.897 + }, + { + "text": "them,", + "start": 88.98, + "end": 89.0, + "confidence": 0.4 + }, + { + "text": "got", + "start": 89.0, + "end": 89.02, + "confidence": 0.869 + }, + { + "text": "them,", + "start": 89.02, + "end": 89.06, + "confidence": 0.47 + }, + { + "text": "got", + "start": 89.18, + "end": 89.2, + "confidence": 0.89 + }, + { + "text": "them,", + "start": 89.2, + "end": 89.22, + "confidence": 0.57 + }, + { + "text": "got", + "start": 89.22, + "end": 89.24, + "confidence": 0.91 + }, + { + "text": "them,", + "start": 89.24, + "end": 89.26, + "confidence": 0.632 + }, + { + "text": "got", + "start": 89.26, + "end": 89.28, + "confidence": 0.598 + }, + { + "text": "them,", + "start": 89.28, + "end": 89.3, + "confidence": 0.743 + }, + { + "text": "got", + "start": 89.3, + "end": 89.32, + "confidence": 0.819 + }, + { + "text": "them,", + "start": 89.32, + "end": 
89.34, + "confidence": 0.84 + }, + { + "text": "got", + "start": 89.34, + "end": 89.36, + "confidence": 0.899 + }, + { + "text": "them,", + "start": 89.36, + "end": 89.38, + "confidence": 0.888 + }, + { + "text": "got", + "start": 89.38, + "end": 89.4, + "confidence": 0.918 + }, + { + "text": "them,", + "start": 89.4, + "end": 89.42, + "confidence": 0.914 + }, + { + "text": "got", + "start": 89.42, + "end": 89.44, + "confidence": 0.936 + }, + { + "text": "them,", + "start": 89.44, + "end": 89.46, + "confidence": 0.932 + }, + { + "text": "got", + "start": 89.46, + "end": 89.48, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 89.48, + "end": 89.5, + "confidence": 0.944 + }, + { + "text": "got", + "start": 89.5, + "end": 89.52, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 89.52, + "end": 89.54, + "confidence": 0.945 + }, + { + "text": "got", + "start": 89.54, + "end": 89.56, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 89.56, + "end": 89.58, + "confidence": 0.944 + }, + { + "text": "got", + "start": 89.58, + "end": 89.6, + "confidence": 0.947 + }, + { + "text": "them,", + "start": 89.6, + "end": 89.62, + "confidence": 0.946 + }, + { + "text": "got", + "start": 89.62, + "end": 89.64, + "confidence": 0.94 + }, + { + "text": "them,", + "start": 89.64, + "end": 89.66, + "confidence": 0.952 + }, + { + "text": "got", + "start": 89.66, + "end": 89.68, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 89.68, + "end": 89.7, + "confidence": 0.954 + }, + { + "text": "got", + "start": 89.7, + "end": 89.72, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 89.72, + "end": 89.74, + "confidence": 0.96 + }, + { + "text": "got", + "start": 89.74, + "end": 89.76, + "confidence": 0.941 + }, + { + "text": "them,", + "start": 89.76, + "end": 89.78, + "confidence": 0.963 + }, + { + "text": "got", + "start": 89.78, + "end": 89.8, + "confidence": 0.945 + }, + { + "text": "them,", + "start": 89.8, + "end": 89.82, + 
"confidence": 0.966 + }, + { + "text": "got", + "start": 89.82, + "end": 89.84, + "confidence": 0.948 + }, + { + "text": "them,", + "start": 89.84, + "end": 89.86, + "confidence": 0.968 + }, + { + "text": "got", + "start": 89.86, + "end": 89.88, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 89.88, + "end": 89.9, + "confidence": 0.971 + }, + { + "text": "got", + "start": 89.9, + "end": 89.92, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 89.92, + "end": 89.94, + "confidence": 0.975 + }, + { + "text": "got", + "start": 89.94, + "end": 89.96, + "confidence": 0.95 + }, + { + "text": "them,", + "start": 89.96, + "end": 89.98, + "confidence": 0.975 + }, + { + "text": "got", + "start": 89.98, + "end": 90.0, + "confidence": 0.951 + }, + { + "text": "them,", + "start": 90.0, + "end": 90.02, + "confidence": 0.977 + }, + { + "text": "got", + "start": 90.02, + "end": 90.04, + "confidence": 0.953 + }, + { + "text": "them,", + "start": 90.04, + "end": 90.06, + "confidence": 0.977 + }, + { + "text": "got", + "start": 90.06, + "end": 90.08, + "confidence": 0.954 + }, + { + "text": "them,", + "start": 90.08, + "end": 90.1, + "confidence": 0.979 + }, + { + "text": "got", + "start": 90.1, + "end": 90.12, + "confidence": 0.955 + }, + { + "text": "them,", + "start": 90.12, + "end": 90.14, + "confidence": 0.979 + }, + { + "text": "got", + "start": 90.14, + "end": 90.16, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 90.16, + "end": 90.18, + "confidence": 0.981 + }, + { + "text": "got", + "start": 90.18, + "end": 90.2, + "confidence": 0.956 + }, + { + "text": "them,", + "start": 90.2, + "end": 90.22, + "confidence": 0.982 + }, + { + "text": "got", + "start": 90.22, + "end": 90.24, + "confidence": 0.958 + }, + { + "text": "them,", + "start": 90.24, + "end": 90.26, + "confidence": 0.982 + }, + { + "text": "got", + "start": 90.26, + "end": 90.28, + "confidence": 0.959 + }, + { + "text": "them,", + "start": 90.28, + "end": 90.3, + "confidence": 
0.982 + }, + { + "text": "got", + "start": 90.3, + "end": 90.32, + "confidence": 0.961 + }, + { + "text": "them,", + "start": 90.32, + "end": 90.34, + "confidence": 0.982 + }, + { + "text": "got", + "start": 90.34, + "end": 90.36, + "confidence": 0.963 + }, + { + "text": "them,", + "start": 90.36, + "end": 90.38, + "confidence": 0.984 + }, + { + "text": "got", + "start": 90.38, + "end": 90.4, + "confidence": 0.964 + }, + { + "text": "them,", + "start": 90.4, + "end": 90.42, + "confidence": 0.984 + }, + { + "text": "got", + "start": 90.42, + "end": 90.44, + "confidence": 0.966 + }, + { + "text": "them,", + "start": 90.44, + "end": 90.46, + "confidence": 0.985 + }, + { + "text": "got", + "start": 90.46, + "end": 90.48, + "confidence": 0.968 + }, + { + "text": "them,", + "start": 90.48, + "end": 90.5, + "confidence": 0.985 + }, + { + "text": "got", + "start": 90.5, + "end": 90.52, + "confidence": 0.969 + }, + { + "text": "them,", + "start": 90.52, + "end": 90.54, + "confidence": 0.986 + }, + { + "text": "got", + "start": 90.54, + "end": 90.56, + "confidence": 0.971 + }, + { + "text": "them,", + "start": 90.56, + "end": 90.58, + "confidence": 0.986 + }, + { + "text": "got", + "start": 90.58, + "end": 90.6, + "confidence": 0.973 + }, + { + "text": "them,", + "start": 90.6, + "end": 90.62, + "confidence": 0.987 + }, + { + "text": "got", + "start": 90.62, + "end": 90.64, + "confidence": 0.974 + }, + { + "text": "them,", + "start": 90.64, + "end": 90.66, + "confidence": 0.987 + }, + { + "text": "got", + "start": 90.66, + "end": 90.68, + "confidence": 0.976 + }, + { + "text": "them,", + "start": 90.68, + "end": 90.7, + "confidence": 0.987 + }, + { + "text": "got", + "start": 90.7, + "end": 90.72, + "confidence": 0.979 + }, + { + "text": "them,", + "start": 90.72, + "end": 90.74, + "confidence": 0.988 + }, + { + "text": "got", + "start": 90.74, + "end": 90.76, + "confidence": 0.98 + }, + { + "text": "them,", + "start": 90.76, + "end": 90.78, + "confidence": 0.989 + }, + { + 
"text": "got", + "start": 90.78, + "end": 90.8, + "confidence": 0.981 + }, + { + "text": "them,", + "start": 90.8, + "end": 90.82, + "confidence": 0.989 + }, + { + "text": "got", + "start": 90.82, + "end": 90.84, + "confidence": 0.983 + }, + { + "text": "them,", + "start": 90.84, + "end": 90.86, + "confidence": 0.989 + }, + { + "text": "got", + "start": 90.86, + "end": 90.88, + "confidence": 0.985 + }, + { + "text": "them,", + "start": 90.88, + "end": 90.9, + "confidence": 0.99 + }, + { + "text": "got", + "start": 90.9, + "end": 90.92, + "confidence": 0.986 + }, + { + "text": "them,", + "start": 90.92, + "end": 90.94, + "confidence": 0.99 + }, + { + "text": "got", + "start": 90.94, + "end": 90.96, + "confidence": 0.987 + }, + { + "text": "them,", + "start": 90.96, + "end": 90.98, + "confidence": 0.991 + }, + { + "text": "got", + "start": 90.98, + "end": 91.0, + "confidence": 0.988 + }, + { + "text": "them,", + "start": 91.0, + "end": 91.02, + "confidence": 0.991 + }, + { + "text": "got", + "start": 91.02, + "end": 91.04, + "confidence": 0.989 + }, + { + "text": "them,", + "start": 91.04, + "end": 91.06, + "confidence": 0.991 + }, + { + "text": "got", + "start": 91.06, + "end": 91.08, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 91.08, + "end": 91.1, + "confidence": 0.992 + }, + { + "text": "got", + "start": 91.1, + "end": 91.12, + "confidence": 0.99 + }, + { + "text": "them,", + "start": 91.12, + "end": 91.14, + "confidence": 0.992 + }, + { + "text": "got", + "start": 91.14, + "end": 91.16, + "confidence": 0.991 + }, + { + "text": "them,", + "start": 91.16, + "end": 91.18, + "confidence": 0.992 + }, + { + "text": "got", + "start": 91.18, + "end": 91.2, + "confidence": 0.992 + }, + { + "text": "them,", + "start": 91.2, + "end": 91.22, + "confidence": 0.992 + }, + { + "text": "got", + "start": 91.22, + "end": 91.24, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 91.24, + "end": 91.26, + "confidence": 0.993 + }, + { + "text": "got", + 
"start": 91.26, + "end": 91.28, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 91.28, + "end": 91.3, + "confidence": 0.992 + }, + { + "text": "got", + "start": 91.3, + "end": 91.32, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 91.32, + "end": 91.34, + "confidence": 0.993 + }, + { + "text": "got", + "start": 91.34, + "end": 91.36, + "confidence": 0.993 + }, + { + "text": "them,", + "start": 91.36, + "end": 91.38, + "confidence": 0.993 + }, + { + "text": "got", + "start": 91.38, + "end": 91.4, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 91.4, + "end": 91.42, + "confidence": 0.993 + }, + { + "text": "got", + "start": 91.42, + "end": 91.44, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 91.44, + "end": 91.46, + "confidence": 0.993 + }, + { + "text": "got", + "start": 91.46, + "end": 91.48, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 91.48, + "end": 91.5, + "confidence": 0.993 + }, + { + "text": "got", + "start": 91.5, + "end": 91.52, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 91.52, + "end": 91.54, + "confidence": 0.993 + }, + { + "text": "got", + "start": 91.54, + "end": 91.56, + "confidence": 0.994 + }, + { + "text": "them,", + "start": 91.56, + "end": 91.58, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.58, + "end": 91.6, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 91.6, + "end": 91.62, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.62, + "end": 91.64, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 91.64, + "end": 91.66, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.66, + "end": 91.68, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 91.68, + "end": 91.7, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.7, + "end": 91.72, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 91.72, + "end": 91.74, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.74, + 
"end": 91.76, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 91.76, + "end": 91.78, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.78, + "end": 91.8, + "confidence": 0.995 + }, + { + "text": "them,", + "start": 91.8, + "end": 91.82, + "confidence": 0.994 + }, + { + "text": "got", + "start": 91.82, + "end": 91.84, + "confidence": 0.995 + }, + { + "text": "them", + "start": 91.84, + "end": 91.86, + "confidence": 0.998 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/punctuations_no/bonjour.wav.csv b/tests/expected/punctuations_no/bonjour.wav.csv new file mode 100644 index 0000000000000000000000000000000000000000..515648b4ee80e092404f6e79d04d7028cefdae78 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.csv @@ -0,0 +1 @@ +Bonjour !,0.14,0.94 diff --git a/tests/expected/punctuations_no/bonjour.wav.srt b/tests/expected/punctuations_no/bonjour.wav.srt new file mode 100644 index 0000000000000000000000000000000000000000..d8d205dc3daf944fcf8cbd38edc5f45287fb5510 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.srt @@ -0,0 +1,4 @@ +1 +00:00:00,140 --> 00:00:00,940 +Bonjour ! + diff --git a/tests/expected/punctuations_no/bonjour.wav.tsv b/tests/expected/punctuations_no/bonjour.wav.tsv new file mode 100644 index 0000000000000000000000000000000000000000..4244f49ea0e650559f762b334550dd60e0a2f2a6 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.tsv @@ -0,0 +1,2 @@ +start end text +140 940 Bonjour ! diff --git a/tests/expected/punctuations_no/bonjour.wav.txt b/tests/expected/punctuations_no/bonjour.wav.txt new file mode 100644 index 0000000000000000000000000000000000000000..6625d5f9893711f1c711cc5a3695219d1f4d9cc4 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.txt @@ -0,0 +1 @@ +Bonjour ! 
diff --git a/tests/expected/punctuations_no/bonjour.wav.vtt b/tests/expected/punctuations_no/bonjour.wav.vtt new file mode 100644 index 0000000000000000000000000000000000000000..ecc03120fcb44b8ed669288169bdae00ce0c79ec --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.vtt @@ -0,0 +1,7 @@ +WEBVTT + +WEBVTT + +00:00.140 --> 00:00.940 +Bonjour ! + diff --git a/tests/expected/punctuations_no/bonjour.wav.words.csv b/tests/expected/punctuations_no/bonjour.wav.words.csv new file mode 100644 index 0000000000000000000000000000000000000000..c164f6417663f8765245f8e23022ad85080f7941 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.words.csv @@ -0,0 +1 @@ +Bonjour,0.14,0.94 diff --git a/tests/expected/punctuations_no/bonjour.wav.words.json b/tests/expected/punctuations_no/bonjour.wav.words.json new file mode 100644 index 0000000000000000000000000000000000000000..16f8fddd1de9409ecc8426f5bd914f21d902393c --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.words.json @@ -0,0 +1,32 @@ +{ + "text": " Bonjour !", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.14, + "end": 0.94, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50402 + ], + "temperature": 0.0, + "avg_logprob": -0.7046648502349854, + "compression_ratio": 0.5294117647058824, + "no_speech_prob": 0.08610370755195618, + "confidence": 0.964, + "words": [ + { + "text": "Bonjour", + "start": 0.14, + "end": 0.94, + "confidence": 0.964 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/punctuations_no/bonjour.wav.words.srt b/tests/expected/punctuations_no/bonjour.wav.words.srt new file mode 100644 index 0000000000000000000000000000000000000000..cd14abb1f5b082f428f7e68574088414fa661db8 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.words.srt @@ -0,0 +1,4 @@ +1 +00:00:00,140 --> 00:00:00,940 +Bonjour + diff --git a/tests/expected/punctuations_no/bonjour.wav.words.tsv 
b/tests/expected/punctuations_no/bonjour.wav.words.tsv new file mode 100644 index 0000000000000000000000000000000000000000..2ddd00966ddffa056b18e3903294c7ef5795ffe1 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.words.tsv @@ -0,0 +1,2 @@ +start end text +140 940 Bonjour diff --git a/tests/expected/punctuations_no/bonjour.wav.words.vtt b/tests/expected/punctuations_no/bonjour.wav.words.vtt new file mode 100644 index 0000000000000000000000000000000000000000..a3ce34860a05ec1125085a02e60a5eac85458c72 --- /dev/null +++ b/tests/expected/punctuations_no/bonjour.wav.words.vtt @@ -0,0 +1,7 @@ +WEBVTT + +WEBVTT + +00:00.140 --> 00:00.940 +Bonjour + diff --git a/tests/expected/punctuations_no/punctuations.mp3.csv b/tests/expected/punctuations_no/punctuations.mp3.csv new file mode 100644 index 0000000000000000000000000000000000000000..32a9d46e0d6565dc2b2aa8bc1bc5c2958fad26f9 --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.csv @@ -0,0 +1 @@ +"Dis-moi, est-ce que l'avion vole ?",0.38,2.76 diff --git a/tests/expected/punctuations_no/punctuations.mp3.srt b/tests/expected/punctuations_no/punctuations.mp3.srt new file mode 100644 index 0000000000000000000000000000000000000000..877851ff9664283f0877d16b24551fa2d7a88226 --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.srt @@ -0,0 +1,4 @@ +1 +00:00:00,380 --> 00:00:02,760 +Dis-moi, est-ce que l'avion vole ? + diff --git a/tests/expected/punctuations_no/punctuations.mp3.tsv b/tests/expected/punctuations_no/punctuations.mp3.tsv new file mode 100644 index 0000000000000000000000000000000000000000..58cf737627008302c822b962a66b0b7e46a3a1de --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.tsv @@ -0,0 +1,2 @@ +start end text +380 2760 Dis-moi, est-ce que l'avion vole ? 
diff --git a/tests/expected/punctuations_no/punctuations.mp3.txt b/tests/expected/punctuations_no/punctuations.mp3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6490b685ff0adf8d95873de48095732fd91c30fd --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.txt @@ -0,0 +1 @@ +Dis-moi, est-ce que l'avion vole ? diff --git a/tests/expected/punctuations_no/punctuations.mp3.vtt b/tests/expected/punctuations_no/punctuations.mp3.vtt new file mode 100644 index 0000000000000000000000000000000000000000..8397a28e233bce3dbd3ddbf7a4226bf3c210e870 --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.vtt @@ -0,0 +1,7 @@ +WEBVTT + +WEBVTT + +00:00.380 --> 00:02.760 +Dis-moi, est-ce que l'avion vole ? + diff --git a/tests/expected/punctuations_no/punctuations.mp3.words.csv b/tests/expected/punctuations_no/punctuations.mp3.words.csv new file mode 100644 index 0000000000000000000000000000000000000000..e5fbcbf2c422d3c24608bdcea9f55eb45171a093 --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.words.csv @@ -0,0 +1,5 @@ +Dis-moi,0.38,1.1 +est-ce,1.28,1.5 +que,1.5,1.66 +l'avion,1.66,2.04 +vole,2.04,2.76 diff --git a/tests/expected/punctuations_no/punctuations.mp3.words.json b/tests/expected/punctuations_no/punctuations.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..e4ff96e3ad4a9ed767427d7c70a4e020f8bf667d --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.words.json @@ -0,0 +1,68 @@ +{ + "text": " Dis-moi, est-ce que l'avion vole ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.38, + "end": 2.76, + "text": " Dis-moi, est-ce que l'avion vole ?", + "tokens": [ + 50364, + 4208, + 12, + 29292, + 11, + 871, + 12, + 384, + 631, + 287, + 6, + 706, + 313, + 49877, + 2506, + 50496 + ], + "temperature": 0.0, + "avg_logprob": -0.26327380012063417, + "compression_ratio": 0.8095238095238095, + "no_speech_prob": 0.03882359713315964, + "confidence": 0.928, + "words": 
[ + { + "text": "Dis-moi", + "start": 0.38, + "end": 1.1, + "confidence": 0.809 + }, + { + "text": "est-ce", + "start": 1.28, + "end": 1.5, + "confidence": 0.968 + }, + { + "text": "que", + "start": 1.5, + "end": 1.66, + "confidence": 0.978 + }, + { + "text": "l'avion", + "start": 1.66, + "end": 2.04, + "confidence": 0.993 + }, + { + "text": "vole", + "start": 2.04, + "end": 2.76, + "confidence": 0.898 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/punctuations_no/punctuations.mp3.words.srt b/tests/expected/punctuations_no/punctuations.mp3.words.srt new file mode 100644 index 0000000000000000000000000000000000000000..9a0041e682bad02b37134d8a0d764cd07b64f608 --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.words.srt @@ -0,0 +1,20 @@ +1 +00:00:00,380 --> 00:00:01,100 +Dis-moi + +2 +00:00:01,280 --> 00:00:01,500 +est-ce + +3 +00:00:01,500 --> 00:00:01,660 +que + +4 +00:00:01,660 --> 00:00:02,040 +l'avion + +5 +00:00:02,040 --> 00:00:02,760 +vole + diff --git a/tests/expected/punctuations_no/punctuations.mp3.words.tsv b/tests/expected/punctuations_no/punctuations.mp3.words.tsv new file mode 100644 index 0000000000000000000000000000000000000000..a9613c4fe6697b2aa5ea56eecd09fb9c18d32210 --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.words.tsv @@ -0,0 +1,6 @@ +start end text +380 1100 Dis-moi +1280 1500 est-ce +1500 1660 que +1660 2040 l'avion +2040 2760 vole diff --git a/tests/expected/punctuations_no/punctuations.mp3.words.vtt b/tests/expected/punctuations_no/punctuations.mp3.words.vtt new file mode 100644 index 0000000000000000000000000000000000000000..fc6f8a3b6558650512d59fcdc3ce41735b03176d --- /dev/null +++ b/tests/expected/punctuations_no/punctuations.mp3.words.vtt @@ -0,0 +1,19 @@ +WEBVTT + +WEBVTT + +00:00.380 --> 00:01.100 +Dis-moi + +00:01.280 --> 00:01.500 +est-ce + +00:01.500 --> 00:01.660 +que + +00:01.660 --> 00:02.040 +l'avion + +00:02.040 --> 00:02.760 +vole + diff 
--git a/tests/expected/punctuations_yes/bonjour.wav.csv b/tests/expected/punctuations_yes/bonjour.wav.csv new file mode 100644 index 0000000000000000000000000000000000000000..515648b4ee80e092404f6e79d04d7028cefdae78 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.csv @@ -0,0 +1 @@ +Bonjour !,0.14,0.94 diff --git a/tests/expected/punctuations_yes/bonjour.wav.srt b/tests/expected/punctuations_yes/bonjour.wav.srt new file mode 100644 index 0000000000000000000000000000000000000000..d8d205dc3daf944fcf8cbd38edc5f45287fb5510 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.srt @@ -0,0 +1,4 @@ +1 +00:00:00,140 --> 00:00:00,940 +Bonjour ! + diff --git a/tests/expected/punctuations_yes/bonjour.wav.tsv b/tests/expected/punctuations_yes/bonjour.wav.tsv new file mode 100644 index 0000000000000000000000000000000000000000..4244f49ea0e650559f762b334550dd60e0a2f2a6 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.tsv @@ -0,0 +1,2 @@ +start end text +140 940 Bonjour ! diff --git a/tests/expected/punctuations_yes/bonjour.wav.txt b/tests/expected/punctuations_yes/bonjour.wav.txt new file mode 100644 index 0000000000000000000000000000000000000000..6625d5f9893711f1c711cc5a3695219d1f4d9cc4 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.txt @@ -0,0 +1 @@ +Bonjour ! diff --git a/tests/expected/punctuations_yes/bonjour.wav.vtt b/tests/expected/punctuations_yes/bonjour.wav.vtt new file mode 100644 index 0000000000000000000000000000000000000000..ecc03120fcb44b8ed669288169bdae00ce0c79ec --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.vtt @@ -0,0 +1,7 @@ +WEBVTT + +WEBVTT + +00:00.140 --> 00:00.940 +Bonjour ! 
+ diff --git a/tests/expected/punctuations_yes/bonjour.wav.words.csv b/tests/expected/punctuations_yes/bonjour.wav.words.csv new file mode 100644 index 0000000000000000000000000000000000000000..515648b4ee80e092404f6e79d04d7028cefdae78 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.words.csv @@ -0,0 +1 @@ +Bonjour !,0.14,0.94 diff --git a/tests/expected/punctuations_yes/bonjour.wav.words.json b/tests/expected/punctuations_yes/bonjour.wav.words.json new file mode 100644 index 0000000000000000000000000000000000000000..1539b7c83897fb3c4c929768b3ef7782d28c3f37 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.words.json @@ -0,0 +1,32 @@ +{ + "text": " Bonjour !", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.14, + "end": 0.94, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50402 + ], + "temperature": 0.0, + "avg_logprob": -0.7046648502349854, + "compression_ratio": 0.5294117647058824, + "no_speech_prob": 0.08610370755195618, + "confidence": 0.964, + "words": [ + { + "text": "Bonjour !", + "start": 0.14, + "end": 0.94, + "confidence": 0.964 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/punctuations_yes/bonjour.wav.words.srt b/tests/expected/punctuations_yes/bonjour.wav.words.srt new file mode 100644 index 0000000000000000000000000000000000000000..d8d205dc3daf944fcf8cbd38edc5f45287fb5510 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.words.srt @@ -0,0 +1,4 @@ +1 +00:00:00,140 --> 00:00:00,940 +Bonjour ! + diff --git a/tests/expected/punctuations_yes/bonjour.wav.words.tsv b/tests/expected/punctuations_yes/bonjour.wav.words.tsv new file mode 100644 index 0000000000000000000000000000000000000000..4244f49ea0e650559f762b334550dd60e0a2f2a6 --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.words.tsv @@ -0,0 +1,2 @@ +start end text +140 940 Bonjour ! 
diff --git a/tests/expected/punctuations_yes/bonjour.wav.words.vtt b/tests/expected/punctuations_yes/bonjour.wav.words.vtt new file mode 100644 index 0000000000000000000000000000000000000000..ecc03120fcb44b8ed669288169bdae00ce0c79ec --- /dev/null +++ b/tests/expected/punctuations_yes/bonjour.wav.words.vtt @@ -0,0 +1,7 @@ +WEBVTT + +WEBVTT + +00:00.140 --> 00:00.940 +Bonjour ! + diff --git a/tests/expected/punctuations_yes/punctuations.mp3.csv b/tests/expected/punctuations_yes/punctuations.mp3.csv new file mode 100644 index 0000000000000000000000000000000000000000..32a9d46e0d6565dc2b2aa8bc1bc5c2958fad26f9 --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.csv @@ -0,0 +1 @@ +"Dis-moi, est-ce que l'avion vole ?",0.38,2.76 diff --git a/tests/expected/punctuations_yes/punctuations.mp3.srt b/tests/expected/punctuations_yes/punctuations.mp3.srt new file mode 100644 index 0000000000000000000000000000000000000000..877851ff9664283f0877d16b24551fa2d7a88226 --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.srt @@ -0,0 +1,4 @@ +1 +00:00:00,380 --> 00:00:02,760 +Dis-moi, est-ce que l'avion vole ? + diff --git a/tests/expected/punctuations_yes/punctuations.mp3.tsv b/tests/expected/punctuations_yes/punctuations.mp3.tsv new file mode 100644 index 0000000000000000000000000000000000000000..58cf737627008302c822b962a66b0b7e46a3a1de --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.tsv @@ -0,0 +1,2 @@ +start end text +380 2760 Dis-moi, est-ce que l'avion vole ? diff --git a/tests/expected/punctuations_yes/punctuations.mp3.txt b/tests/expected/punctuations_yes/punctuations.mp3.txt new file mode 100644 index 0000000000000000000000000000000000000000..6490b685ff0adf8d95873de48095732fd91c30fd --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.txt @@ -0,0 +1 @@ +Dis-moi, est-ce que l'avion vole ? 
diff --git a/tests/expected/punctuations_yes/punctuations.mp3.vtt b/tests/expected/punctuations_yes/punctuations.mp3.vtt new file mode 100644 index 0000000000000000000000000000000000000000..8397a28e233bce3dbd3ddbf7a4226bf3c210e870 --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.vtt @@ -0,0 +1,7 @@ +WEBVTT + +WEBVTT + +00:00.380 --> 00:02.760 +Dis-moi, est-ce que l'avion vole ? + diff --git a/tests/expected/punctuations_yes/punctuations.mp3.words.csv b/tests/expected/punctuations_yes/punctuations.mp3.words.csv new file mode 100644 index 0000000000000000000000000000000000000000..6d6a4383de2f4c469a0fc0048edda5d5d3cfc3e9 --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.words.csv @@ -0,0 +1,5 @@ +"Dis-moi,",0.38,1.1 +est-ce,1.28,1.5 +que,1.5,1.66 +l'avion,1.66,2.04 +vole ?,2.04,2.76 diff --git a/tests/expected/punctuations_yes/punctuations.mp3.words.json b/tests/expected/punctuations_yes/punctuations.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..ea6d774cf345132b175fedfe5a717c4cd27cc3aa --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.words.json @@ -0,0 +1,68 @@ +{ + "text": " Dis-moi, est-ce que l'avion vole ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.38, + "end": 2.76, + "text": " Dis-moi, est-ce que l'avion vole ?", + "tokens": [ + 50364, + 4208, + 12, + 29292, + 11, + 871, + 12, + 384, + 631, + 287, + 6, + 706, + 313, + 49877, + 2506, + 50496 + ], + "temperature": 0.0, + "avg_logprob": -0.26327380012063417, + "compression_ratio": 0.8095238095238095, + "no_speech_prob": 0.03882359713315964, + "confidence": 0.928, + "words": [ + { + "text": "Dis-moi,", + "start": 0.38, + "end": 1.1, + "confidence": 0.809 + }, + { + "text": "est-ce", + "start": 1.28, + "end": 1.5, + "confidence": 0.968 + }, + { + "text": "que", + "start": 1.5, + "end": 1.66, + "confidence": 0.978 + }, + { + "text": "l'avion", + "start": 1.66, + "end": 2.04, + "confidence": 0.993 + }, + { + 
"text": "vole ?", + "start": 2.04, + "end": 2.76, + "confidence": 0.898 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/punctuations_yes/punctuations.mp3.words.srt b/tests/expected/punctuations_yes/punctuations.mp3.words.srt new file mode 100644 index 0000000000000000000000000000000000000000..91c0fbf35dff3f5043392a4b6035510d073372d4 --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.words.srt @@ -0,0 +1,20 @@ +1 +00:00:00,380 --> 00:00:01,100 +Dis-moi, + +2 +00:00:01,280 --> 00:00:01,500 +est-ce + +3 +00:00:01,500 --> 00:00:01,660 +que + +4 +00:00:01,660 --> 00:00:02,040 +l'avion + +5 +00:00:02,040 --> 00:00:02,760 +vole ? + diff --git a/tests/expected/punctuations_yes/punctuations.mp3.words.tsv b/tests/expected/punctuations_yes/punctuations.mp3.words.tsv new file mode 100644 index 0000000000000000000000000000000000000000..f267961f36fcab7036a58e7e979625d89df087e4 --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.words.tsv @@ -0,0 +1,6 @@ +start end text +380 1100 Dis-moi, +1280 1500 est-ce +1500 1660 que +1660 2040 l'avion +2040 2760 vole ? diff --git a/tests/expected/punctuations_yes/punctuations.mp3.words.vtt b/tests/expected/punctuations_yes/punctuations.mp3.words.vtt new file mode 100644 index 0000000000000000000000000000000000000000..0a2cdcec1b994bb7512933594d72181013183838 --- /dev/null +++ b/tests/expected/punctuations_yes/punctuations.mp3.words.vtt @@ -0,0 +1,19 @@ +WEBVTT + +WEBVTT + +00:00.380 --> 00:01.100 +Dis-moi, + +00:01.280 --> 00:01.500 +est-ce + +00:01.500 --> 00:01.660 +que + +00:01.660 --> 00:02.040 +l'avion + +00:02.040 --> 00:02.760 +vole ? 
+ diff --git a/tests/expected/small.en.cpu/arabic.mp3.words.json b/tests/expected/small.en.cpu/arabic.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..acb72a1674c019af75523e14dc77422914030a68 --- /dev/null +++ b/tests/expected/small.en.cpu/arabic.mp3.words.json @@ -0,0 +1,3346 @@ +{ + "text": " I am the one who is the one who is the one who is the one who is the one who is the one I am the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is 
the one who is the one who is the one who is the one who is the one who is the one who is", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 1.0, + "end": 7.72, + "text": " I am the one who is the one who is the one who is the one who is the one who is the one", + "tokens": [ + 314, + 716, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530 + ], + "temperature": 0.0, + "avg_logprob": -0.23478534274631077, + "compression_ratio": 24.294117647058822, + "no_speech_prob": 0.6507940292358398, + "confidence": 0.358, + "words": [ + { + "text": "I", + "start": 1.0, + "end": 3.16, + "confidence": 0.053 + }, + { + "text": "am", + "start": 3.16, + "end": 4.04, + "confidence": 0.152 + }, + { + "text": "the", + "start": 4.04, + "end": 4.08, + "confidence": 0.143 + }, + { + "text": "one", + "start": 4.08, + "end": 6.1, + "confidence": 0.085 + }, + { + "text": "who", + "start": 6.1, + "end": 6.28, + "confidence": 0.718 + }, + { + "text": "is", + "start": 6.28, + "end": 6.32, + "confidence": 0.12 + }, + { + "text": "the", + "start": 6.32, + "end": 6.36, + "confidence": 0.134 + }, + { + "text": "one", + "start": 6.36, + "end": 6.4, + "confidence": 0.204 + }, + { + "text": "who", + "start": 6.4, + "end": 6.44, + "confidence": 0.618 + }, + { + "text": "is", + "start": 6.44, + "end": 6.96, + "confidence": 0.319 + }, + { + "text": "the", + "start": 6.96, + "end": 7.0, + "confidence": 0.382 + }, + { + "text": "one", + "start": 7.0, + "end": 7.24, + "confidence": 0.443 + }, + { + "text": "who", + "start": 7.24, + "end": 7.28, + "confidence": 0.448 + }, + { + "text": "is", + "start": 7.28, + "end": 7.32, + "confidence": 0.518 + }, + { + "text": "the", + "start": 7.32, + "end": 7.36, + "confidence": 0.543 + }, + { + "text": "one", + "start": 7.36, + "end": 7.4, + "confidence": 0.723 + }, + { + "text": "who", + "start": 7.4, + "end": 7.44, + "confidence": 0.433 + }, + { + "text": "is", 
+ "start": 7.44, + "end": 7.48, + "confidence": 0.678 + }, + { + "text": "the", + "start": 7.48, + "end": 7.52, + "confidence": 0.636 + }, + { + "text": "one", + "start": 7.52, + "end": 7.56, + "confidence": 0.817 + }, + { + "text": "who", + "start": 7.56, + "end": 7.6, + "confidence": 0.505 + }, + { + "text": "is", + "start": 7.6, + "end": 7.64, + "confidence": 0.74 + }, + { + "text": "the", + "start": 7.64, + "end": 7.68, + "confidence": 0.697 + }, + { + "text": "one", + "start": 7.68, + "end": 7.72, + "confidence": 0.698 + } + ] + }, + { + "id": 1, + "seek": 700, + "start": 7.72, + "end": 37.02, + "text": " I am the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the", + "tokens": [ + 50363, + 314, + 716, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 
262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262 + ], + "temperature": 0.0, + "avg_logprob": -0.06210707770453559, + "compression_ratio": 24.5, + "no_speech_prob": 3.115955405519344e-05, + "confidence": 0.939, + "words": [ + { + "text": "I", + "start": 7.72, + "end": 9.42, + "confidence": 0.22 + }, + { + "text": "am", + "start": 9.42, + "end": 12.1, + "confidence": 0.81 + }, + { + "text": "the", + "start": 12.1, + "end": 12.48, + "confidence": 0.872 + }, + { + "text": "one", + "start": 12.48, + "end": 12.58, + "confidence": 0.927 + }, + { + "text": "who", + "start": 12.58, + "end": 13.4, + "confidence": 0.966 + }, + { + "text": "is", + "start": 13.4, + "end": 13.96, + "confidence": 0.934 + }, + { + "text": "the", + "start": 13.96, + "end": 14.56, + "confidence": 0.968 + }, + { + "text": "one", + "start": 14.56, + "end": 14.6, + "confidence": 0.989 + }, + { + "text": "who", + "start": 14.6, + "end": 14.64, + "confidence": 0.951 + }, + { + "text": "is", + "start": 14.64, + "end": 14.68, + 
"confidence": 0.965 + }, + { + "text": "the", + "start": 14.68, + "end": 15.04, + "confidence": 0.977 + }, + { + "text": "one", + "start": 15.04, + "end": 17.78, + "confidence": 0.993 + }, + { + "text": "who", + "start": 17.78, + "end": 17.82, + "confidence": 0.843 + }, + { + "text": "is", + "start": 17.82, + "end": 18.58, + "confidence": 0.977 + }, + { + "text": "the", + "start": 18.58, + "end": 18.62, + "confidence": 0.979 + }, + { + "text": "one", + "start": 18.62, + "end": 18.66, + "confidence": 0.991 + }, + { + "text": "who", + "start": 18.66, + "end": 19.46, + "confidence": 0.694 + }, + { + "text": "is", + "start": 19.46, + "end": 20.9, + "confidence": 0.979 + }, + { + "text": "the", + "start": 20.9, + "end": 20.94, + "confidence": 0.978 + }, + { + "text": "one", + "start": 20.94, + "end": 20.98, + "confidence": 0.99 + }, + { + "text": "who", + "start": 20.98, + "end": 21.02, + "confidence": 0.657 + }, + { + "text": "is", + "start": 21.02, + "end": 21.06, + "confidence": 0.977 + }, + { + "text": "the", + "start": 21.06, + "end": 21.52, + "confidence": 0.974 + }, + { + "text": "one", + "start": 21.52, + "end": 21.56, + "confidence": 0.983 + }, + { + "text": "who", + "start": 21.56, + "end": 21.6, + "confidence": 0.609 + }, + { + "text": "is", + "start": 21.6, + "end": 22.04, + "confidence": 0.978 + }, + { + "text": "the", + "start": 22.04, + "end": 22.5, + "confidence": 0.966 + }, + { + "text": "one", + "start": 22.5, + "end": 23.6, + "confidence": 0.986 + }, + { + "text": "who", + "start": 23.6, + "end": 24.76, + "confidence": 0.624 + }, + { + "text": "is", + "start": 24.76, + "end": 26.18, + "confidence": 0.978 + }, + { + "text": "the", + "start": 26.18, + "end": 26.8, + "confidence": 0.962 + }, + { + "text": "one", + "start": 26.8, + "end": 26.84, + "confidence": 0.984 + }, + { + "text": "who", + "start": 26.84, + "end": 26.88, + "confidence": 0.679 + }, + { + "text": "is", + "start": 26.88, + "end": 27.4, + "confidence": 0.978 + }, + { + "text": "the", + 
"start": 27.4, + "end": 28.14, + "confidence": 0.958 + }, + { + "text": "one", + "start": 28.14, + "end": 28.28, + "confidence": 0.98 + }, + { + "text": "who", + "start": 28.28, + "end": 28.32, + "confidence": 0.671 + }, + { + "text": "is", + "start": 28.32, + "end": 28.36, + "confidence": 0.979 + }, + { + "text": "the", + "start": 28.36, + "end": 28.4, + "confidence": 0.955 + }, + { + "text": "one", + "start": 28.4, + "end": 28.8, + "confidence": 0.975 + }, + { + "text": "who", + "start": 28.8, + "end": 29.14, + "confidence": 0.683 + }, + { + "text": "is", + "start": 29.14, + "end": 29.18, + "confidence": 0.978 + }, + { + "text": "the", + "start": 29.18, + "end": 29.22, + "confidence": 0.956 + }, + { + "text": "one", + "start": 29.22, + "end": 29.56, + "confidence": 0.972 + }, + { + "text": "who", + "start": 29.56, + "end": 29.74, + "confidence": 0.695 + }, + { + "text": "is", + "start": 29.74, + "end": 29.78, + "confidence": 0.978 + }, + { + "text": "the", + "start": 29.78, + "end": 29.82, + "confidence": 0.957 + }, + { + "text": "one", + "start": 29.82, + "end": 29.86, + "confidence": 0.971 + }, + { + "text": "who", + "start": 29.86, + "end": 29.9, + "confidence": 0.713 + }, + { + "text": "is", + "start": 29.9, + "end": 29.94, + "confidence": 0.98 + }, + { + "text": "the", + "start": 29.94, + "end": 29.98, + "confidence": 0.958 + }, + { + "text": "one", + "start": 29.98, + "end": 30.02, + "confidence": 0.971 + }, + { + "text": "who", + "start": 30.02, + "end": 30.06, + "confidence": 0.737 + }, + { + "text": "is", + "start": 30.06, + "end": 30.1, + "confidence": 0.982 + }, + { + "text": "the", + "start": 30.1, + "end": 30.14, + "confidence": 0.96 + }, + { + "text": "one", + "start": 30.14, + "end": 30.18, + "confidence": 0.971 + }, + { + "text": "who", + "start": 30.18, + "end": 30.22, + "confidence": 0.754 + }, + { + "text": "is", + "start": 30.22, + "end": 30.26, + "confidence": 0.984 + }, + { + "text": "the", + "start": 30.26, + "end": 30.3, + "confidence": 
0.962 + }, + { + "text": "one", + "start": 30.3, + "end": 30.34, + "confidence": 0.973 + }, + { + "text": "who", + "start": 30.34, + "end": 30.38, + "confidence": 0.759 + }, + { + "text": "is", + "start": 30.38, + "end": 30.42, + "confidence": 0.986 + }, + { + "text": "the", + "start": 30.42, + "end": 30.46, + "confidence": 0.964 + }, + { + "text": "one", + "start": 30.46, + "end": 30.5, + "confidence": 0.974 + }, + { + "text": "who", + "start": 30.5, + "end": 30.54, + "confidence": 0.765 + }, + { + "text": "is", + "start": 30.54, + "end": 30.58, + "confidence": 0.987 + }, + { + "text": "the", + "start": 30.58, + "end": 30.62, + "confidence": 0.966 + }, + { + "text": "one", + "start": 30.62, + "end": 30.66, + "confidence": 0.975 + }, + { + "text": "who", + "start": 30.66, + "end": 30.7, + "confidence": 0.774 + }, + { + "text": "is", + "start": 30.7, + "end": 30.74, + "confidence": 0.988 + }, + { + "text": "the", + "start": 30.74, + "end": 30.78, + "confidence": 0.969 + }, + { + "text": "one", + "start": 30.78, + "end": 30.82, + "confidence": 0.975 + }, + { + "text": "who", + "start": 30.82, + "end": 30.86, + "confidence": 0.801 + }, + { + "text": "is", + "start": 30.86, + "end": 30.9, + "confidence": 0.989 + }, + { + "text": "the", + "start": 30.9, + "end": 30.94, + "confidence": 0.97 + }, + { + "text": "one", + "start": 30.94, + "end": 30.98, + "confidence": 0.976 + }, + { + "text": "who", + "start": 30.98, + "end": 31.02, + "confidence": 0.818 + }, + { + "text": "is", + "start": 31.02, + "end": 31.06, + "confidence": 0.989 + }, + { + "text": "the", + "start": 31.06, + "end": 31.1, + "confidence": 0.972 + }, + { + "text": "one", + "start": 31.1, + "end": 31.14, + "confidence": 0.977 + }, + { + "text": "who", + "start": 31.14, + "end": 31.18, + "confidence": 0.838 + }, + { + "text": "is", + "start": 31.18, + "end": 31.22, + "confidence": 0.989 + }, + { + "text": "the", + "start": 31.22, + "end": 31.26, + "confidence": 0.973 + }, + { + "text": "one", + "start": 
31.26, + "end": 31.3, + "confidence": 0.977 + }, + { + "text": "who", + "start": 31.3, + "end": 31.34, + "confidence": 0.862 + }, + { + "text": "is", + "start": 31.34, + "end": 31.38, + "confidence": 0.989 + }, + { + "text": "the", + "start": 31.38, + "end": 31.42, + "confidence": 0.974 + }, + { + "text": "one", + "start": 31.42, + "end": 31.46, + "confidence": 0.977 + }, + { + "text": "who", + "start": 31.46, + "end": 31.5, + "confidence": 0.882 + }, + { + "text": "is", + "start": 31.5, + "end": 31.54, + "confidence": 0.989 + }, + { + "text": "the", + "start": 31.54, + "end": 31.58, + "confidence": 0.974 + }, + { + "text": "one", + "start": 31.58, + "end": 31.62, + "confidence": 0.977 + }, + { + "text": "who", + "start": 31.62, + "end": 31.66, + "confidence": 0.895 + }, + { + "text": "is", + "start": 31.66, + "end": 31.7, + "confidence": 0.989 + }, + { + "text": "the", + "start": 31.7, + "end": 31.74, + "confidence": 0.975 + }, + { + "text": "one", + "start": 31.74, + "end": 31.78, + "confidence": 0.977 + }, + { + "text": "who", + "start": 31.78, + "end": 31.82, + "confidence": 0.905 + }, + { + "text": "is", + "start": 31.82, + "end": 31.86, + "confidence": 0.989 + }, + { + "text": "the", + "start": 31.86, + "end": 31.9, + "confidence": 0.975 + }, + { + "text": "one", + "start": 31.9, + "end": 31.94, + "confidence": 0.977 + }, + { + "text": "who", + "start": 31.94, + "end": 31.98, + "confidence": 0.92 + }, + { + "text": "is", + "start": 31.98, + "end": 32.02, + "confidence": 0.99 + }, + { + "text": "the", + "start": 32.02, + "end": 32.06, + "confidence": 0.976 + }, + { + "text": "one", + "start": 32.06, + "end": 32.1, + "confidence": 0.978 + }, + { + "text": "who", + "start": 32.1, + "end": 32.14, + "confidence": 0.924 + }, + { + "text": "is", + "start": 32.14, + "end": 32.18, + "confidence": 0.99 + }, + { + "text": "the", + "start": 32.18, + "end": 32.22, + "confidence": 0.977 + }, + { + "text": "one", + "start": 32.22, + "end": 32.26, + "confidence": 0.978 + }, 
+ { + "text": "who", + "start": 32.26, + "end": 32.3, + "confidence": 0.932 + }, + { + "text": "is", + "start": 32.3, + "end": 32.34, + "confidence": 0.989 + }, + { + "text": "the", + "start": 32.34, + "end": 32.38, + "confidence": 0.976 + }, + { + "text": "one", + "start": 32.38, + "end": 32.42, + "confidence": 0.977 + }, + { + "text": "who", + "start": 32.42, + "end": 32.46, + "confidence": 0.936 + }, + { + "text": "is", + "start": 32.46, + "end": 32.5, + "confidence": 0.99 + }, + { + "text": "the", + "start": 32.5, + "end": 32.54, + "confidence": 0.977 + }, + { + "text": "one", + "start": 32.54, + "end": 32.58, + "confidence": 0.978 + }, + { + "text": "who", + "start": 32.58, + "end": 32.62, + "confidence": 0.94 + }, + { + "text": "is", + "start": 32.62, + "end": 32.66, + "confidence": 0.99 + }, + { + "text": "the", + "start": 32.66, + "end": 32.7, + "confidence": 0.977 + }, + { + "text": "one", + "start": 32.7, + "end": 32.74, + "confidence": 0.978 + }, + { + "text": "who", + "start": 32.74, + "end": 32.78, + "confidence": 0.942 + }, + { + "text": "is", + "start": 32.78, + "end": 32.82, + "confidence": 0.989 + }, + { + "text": "the", + "start": 32.82, + "end": 32.86, + "confidence": 0.977 + }, + { + "text": "one", + "start": 32.86, + "end": 32.9, + "confidence": 0.978 + }, + { + "text": "who", + "start": 32.9, + "end": 32.94, + "confidence": 0.941 + }, + { + "text": "is", + "start": 32.94, + "end": 32.98, + "confidence": 0.989 + }, + { + "text": "the", + "start": 32.98, + "end": 33.02, + "confidence": 0.978 + }, + { + "text": "one", + "start": 33.02, + "end": 33.06, + "confidence": 0.978 + }, + { + "text": "who", + "start": 33.06, + "end": 33.1, + "confidence": 0.942 + }, + { + "text": "is", + "start": 33.1, + "end": 33.14, + "confidence": 0.989 + }, + { + "text": "the", + "start": 33.14, + "end": 33.18, + "confidence": 0.978 + }, + { + "text": "one", + "start": 33.18, + "end": 33.22, + "confidence": 0.978 + }, + { + "text": "who", + "start": 33.22, + "end": 
33.26, + "confidence": 0.942 + }, + { + "text": "is", + "start": 33.26, + "end": 33.3, + "confidence": 0.99 + }, + { + "text": "the", + "start": 33.3, + "end": 33.34, + "confidence": 0.978 + }, + { + "text": "one", + "start": 33.34, + "end": 33.38, + "confidence": 0.978 + }, + { + "text": "who", + "start": 33.38, + "end": 33.42, + "confidence": 0.941 + }, + { + "text": "is", + "start": 33.42, + "end": 33.46, + "confidence": 0.989 + }, + { + "text": "the", + "start": 33.46, + "end": 33.5, + "confidence": 0.979 + }, + { + "text": "one", + "start": 33.5, + "end": 33.54, + "confidence": 0.977 + }, + { + "text": "who", + "start": 33.54, + "end": 33.58, + "confidence": 0.941 + }, + { + "text": "is", + "start": 33.58, + "end": 33.62, + "confidence": 0.989 + }, + { + "text": "the", + "start": 33.62, + "end": 33.66, + "confidence": 0.978 + }, + { + "text": "one", + "start": 33.66, + "end": 33.7, + "confidence": 0.977 + }, + { + "text": "who", + "start": 33.7, + "end": 33.74, + "confidence": 0.939 + }, + { + "text": "is", + "start": 33.74, + "end": 33.78, + "confidence": 0.989 + }, + { + "text": "the", + "start": 33.78, + "end": 33.82, + "confidence": 0.979 + }, + { + "text": "one", + "start": 33.82, + "end": 33.86, + "confidence": 0.977 + }, + { + "text": "who", + "start": 33.86, + "end": 33.9, + "confidence": 0.939 + }, + { + "text": "is", + "start": 33.9, + "end": 33.94, + "confidence": 0.989 + }, + { + "text": "the", + "start": 33.94, + "end": 33.98, + "confidence": 0.979 + }, + { + "text": "one", + "start": 33.98, + "end": 34.02, + "confidence": 0.977 + }, + { + "text": "who", + "start": 34.02, + "end": 34.06, + "confidence": 0.938 + }, + { + "text": "is", + "start": 34.06, + "end": 34.1, + "confidence": 0.989 + }, + { + "text": "the", + "start": 34.1, + "end": 34.14, + "confidence": 0.978 + }, + { + "text": "one", + "start": 34.14, + "end": 34.18, + "confidence": 0.977 + }, + { + "text": "who", + "start": 34.18, + "end": 34.22, + "confidence": 0.936 + }, + { + "text": 
"is", + "start": 34.22, + "end": 34.26, + "confidence": 0.989 + }, + { + "text": "the", + "start": 34.26, + "end": 34.3, + "confidence": 0.978 + }, + { + "text": "one", + "start": 34.3, + "end": 34.34, + "confidence": 0.977 + }, + { + "text": "who", + "start": 34.34, + "end": 34.38, + "confidence": 0.936 + }, + { + "text": "is", + "start": 34.38, + "end": 34.42, + "confidence": 0.989 + }, + { + "text": "the", + "start": 34.42, + "end": 34.46, + "confidence": 0.979 + }, + { + "text": "one", + "start": 34.46, + "end": 34.5, + "confidence": 0.976 + }, + { + "text": "who", + "start": 34.5, + "end": 34.54, + "confidence": 0.936 + }, + { + "text": "is", + "start": 34.54, + "end": 34.58, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.58, + "end": 34.62, + "confidence": 0.978 + }, + { + "text": "one", + "start": 34.62, + "end": 34.66, + "confidence": 0.977 + }, + { + "text": "who", + "start": 34.66, + "end": 34.7, + "confidence": 0.936 + }, + { + "text": "is", + "start": 34.7, + "end": 34.74, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.74, + "end": 34.78, + "confidence": 0.978 + }, + { + "text": "one", + "start": 34.78, + "end": 34.82, + "confidence": 0.976 + }, + { + "text": "who", + "start": 34.82, + "end": 34.86, + "confidence": 0.935 + }, + { + "text": "is", + "start": 34.86, + "end": 34.9, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.9, + "end": 34.94, + "confidence": 0.979 + }, + { + "text": "one", + "start": 34.94, + "end": 34.98, + "confidence": 0.976 + }, + { + "text": "who", + "start": 34.98, + "end": 35.02, + "confidence": 0.936 + }, + { + "text": "is", + "start": 35.02, + "end": 35.06, + "confidence": 0.987 + }, + { + "text": "the", + "start": 35.06, + "end": 35.1, + "confidence": 0.978 + }, + { + "text": "one", + "start": 35.1, + "end": 35.14, + "confidence": 0.976 + }, + { + "text": "who", + "start": 35.14, + "end": 35.18, + "confidence": 0.936 + }, + { + "text": "is", + "start": 35.18, + "end": 35.22, + 
"confidence": 0.987 + }, + { + "text": "the", + "start": 35.22, + "end": 35.26, + "confidence": 0.978 + }, + { + "text": "one", + "start": 35.26, + "end": 35.3, + "confidence": 0.976 + }, + { + "text": "who", + "start": 35.3, + "end": 35.34, + "confidence": 0.935 + }, + { + "text": "is", + "start": 35.34, + "end": 35.38, + "confidence": 0.987 + }, + { + "text": "the", + "start": 35.38, + "end": 35.42, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.42, + "end": 35.46, + "confidence": 0.976 + }, + { + "text": "who", + "start": 35.46, + "end": 35.5, + "confidence": 0.934 + }, + { + "text": "is", + "start": 35.5, + "end": 35.54, + "confidence": 0.986 + }, + { + "text": "the", + "start": 35.54, + "end": 35.58, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.58, + "end": 35.62, + "confidence": 0.976 + }, + { + "text": "who", + "start": 35.62, + "end": 35.66, + "confidence": 0.933 + }, + { + "text": "is", + "start": 35.66, + "end": 35.7, + "confidence": 0.985 + }, + { + "text": "the", + "start": 35.7, + "end": 35.74, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.74, + "end": 35.78, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.78, + "end": 35.82, + "confidence": 0.939 + }, + { + "text": "is", + "start": 35.82, + "end": 35.86, + "confidence": 0.986 + }, + { + "text": "the", + "start": 35.86, + "end": 35.9, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.9, + "end": 35.94, + "confidence": 0.975 + }, + { + "text": "who", + "start": 35.94, + "end": 35.98, + "confidence": 0.932 + }, + { + "text": "is", + "start": 35.98, + "end": 36.02, + "confidence": 0.984 + }, + { + "text": "the", + "start": 36.02, + "end": 36.06, + "confidence": 0.976 + }, + { + "text": "one", + "start": 36.06, + "end": 36.1, + "confidence": 0.975 + }, + { + "text": "who", + "start": 36.1, + "end": 36.14, + "confidence": 0.931 + }, + { + "text": "is", + "start": 36.14, + "end": 36.18, + "confidence": 0.984 + }, + { + "text": "the", + 
"start": 36.18, + "end": 36.22, + "confidence": 0.976 + }, + { + "text": "one", + "start": 36.22, + "end": 36.26, + "confidence": 0.975 + }, + { + "text": "who", + "start": 36.26, + "end": 36.3, + "confidence": 0.929 + }, + { + "text": "is", + "start": 36.3, + "end": 36.34, + "confidence": 0.983 + }, + { + "text": "the", + "start": 36.34, + "end": 36.38, + "confidence": 0.975 + }, + { + "text": "one", + "start": 36.38, + "end": 36.42, + "confidence": 0.975 + }, + { + "text": "who", + "start": 36.42, + "end": 36.46, + "confidence": 0.929 + }, + { + "text": "is", + "start": 36.46, + "end": 36.5, + "confidence": 0.982 + }, + { + "text": "the", + "start": 36.5, + "end": 36.54, + "confidence": 0.974 + }, + { + "text": "one", + "start": 36.54, + "end": 36.58, + "confidence": 0.975 + }, + { + "text": "who", + "start": 36.58, + "end": 36.62, + "confidence": 0.928 + }, + { + "text": "is", + "start": 36.62, + "end": 36.66, + "confidence": 0.982 + }, + { + "text": "the", + "start": 36.66, + "end": 36.7, + "confidence": 0.974 + }, + { + "text": "one", + "start": 36.7, + "end": 36.74, + "confidence": 0.975 + }, + { + "text": "who", + "start": 36.74, + "end": 36.92, + "confidence": 0.928 + }, + { + "text": "is", + "start": 36.92, + "end": 36.98, + "confidence": 0.981 + }, + { + "text": "the", + "start": 36.98, + "end": 37.02, + "confidence": 0.973 + } + ] + }, + { + "id": 2, + "seek": 3700, + "start": 37.02, + "end": 67.0, + "text": " one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the 
one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is", + "tokens": [ + 50363, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318 + ], + "temperature": 0.0, + "avg_logprob": -0.017284017139010958, + "compression_ratio": 26.93548387096774, + "no_speech_prob": 
0.09498446434736252, + "confidence": 0.983, + "words": [ + { + "text": "one", + "start": 37.02, + "end": 37.4, + "confidence": 0.964 + }, + { + "text": "who", + "start": 37.4, + "end": 39.86, + "confidence": 0.961 + }, + { + "text": "is", + "start": 39.86, + "end": 39.9, + "confidence": 0.977 + }, + { + "text": "the", + "start": 39.9, + "end": 39.94, + "confidence": 0.975 + }, + { + "text": "one", + "start": 39.94, + "end": 39.98, + "confidence": 0.964 + }, + { + "text": "who", + "start": 39.98, + "end": 40.02, + "confidence": 0.982 + }, + { + "text": "is", + "start": 40.02, + "end": 40.06, + "confidence": 0.989 + }, + { + "text": "the", + "start": 40.06, + "end": 40.1, + "confidence": 0.978 + }, + { + "text": "one", + "start": 40.1, + "end": 40.14, + "confidence": 0.98 + }, + { + "text": "who", + "start": 40.14, + "end": 40.18, + "confidence": 0.989 + }, + { + "text": "is", + "start": 40.18, + "end": 40.22, + "confidence": 0.992 + }, + { + "text": "the", + "start": 40.22, + "end": 40.26, + "confidence": 0.97 + }, + { + "text": "one", + "start": 40.26, + "end": 40.3, + "confidence": 0.982 + }, + { + "text": "who", + "start": 40.3, + "end": 40.34, + "confidence": 0.989 + }, + { + "text": "is", + "start": 40.34, + "end": 40.38, + "confidence": 0.993 + }, + { + "text": "the", + "start": 40.38, + "end": 40.42, + "confidence": 0.971 + }, + { + "text": "one", + "start": 40.42, + "end": 40.46, + "confidence": 0.984 + }, + { + "text": "who", + "start": 40.46, + "end": 40.5, + "confidence": 0.99 + }, + { + "text": "is", + "start": 40.5, + "end": 40.54, + "confidence": 0.994 + }, + { + "text": "the", + "start": 40.54, + "end": 40.58, + "confidence": 0.969 + }, + { + "text": "one", + "start": 40.58, + "end": 40.62, + "confidence": 0.985 + }, + { + "text": "who", + "start": 40.62, + "end": 40.66, + "confidence": 0.989 + }, + { + "text": "is", + "start": 40.66, + "end": 40.7, + "confidence": 0.991 + }, + { + "text": "the", + "start": 40.7, + "end": 40.74, + "confidence": 0.625 
+ }, + { + "text": "one", + "start": 40.74, + "end": 40.78, + "confidence": 0.947 + }, + { + "text": "who", + "start": 40.78, + "end": 40.82, + "confidence": 0.985 + }, + { + "text": "is", + "start": 40.82, + "end": 40.86, + "confidence": 0.99 + }, + { + "text": "the", + "start": 40.86, + "end": 40.9, + "confidence": 0.91 + }, + { + "text": "one", + "start": 40.9, + "end": 40.94, + "confidence": 0.984 + }, + { + "text": "who", + "start": 40.94, + "end": 40.98, + "confidence": 0.986 + }, + { + "text": "is", + "start": 40.98, + "end": 41.02, + "confidence": 0.994 + }, + { + "text": "the", + "start": 41.02, + "end": 41.06, + "confidence": 0.933 + }, + { + "text": "one", + "start": 41.06, + "end": 41.1, + "confidence": 0.985 + }, + { + "text": "who", + "start": 41.1, + "end": 41.14, + "confidence": 0.988 + }, + { + "text": "is", + "start": 41.14, + "end": 41.18, + "confidence": 0.996 + }, + { + "text": "the", + "start": 41.18, + "end": 41.22, + "confidence": 0.948 + }, + { + "text": "one", + "start": 41.22, + "end": 41.26, + "confidence": 0.987 + }, + { + "text": "who", + "start": 41.26, + "end": 41.3, + "confidence": 0.989 + }, + { + "text": "is", + "start": 41.3, + "end": 41.34, + "confidence": 0.997 + }, + { + "text": "the", + "start": 41.34, + "end": 41.38, + "confidence": 0.961 + }, + { + "text": "one", + "start": 41.38, + "end": 41.42, + "confidence": 0.988 + }, + { + "text": "who", + "start": 41.42, + "end": 41.46, + "confidence": 0.99 + }, + { + "text": "is", + "start": 41.46, + "end": 41.5, + "confidence": 0.997 + }, + { + "text": "the", + "start": 41.5, + "end": 41.54, + "confidence": 0.969 + }, + { + "text": "one", + "start": 41.54, + "end": 41.58, + "confidence": 0.989 + }, + { + "text": "who", + "start": 41.58, + "end": 41.62, + "confidence": 0.99 + }, + { + "text": "is", + "start": 41.62, + "end": 41.66, + "confidence": 0.998 + }, + { + "text": "the", + "start": 41.66, + "end": 41.7, + "confidence": 0.976 + }, + { + "text": "one", + "start": 41.7, + 
"end": 41.74, + "confidence": 0.99 + }, + { + "text": "who", + "start": 41.74, + "end": 41.78, + "confidence": 0.99 + }, + { + "text": "is", + "start": 41.78, + "end": 41.82, + "confidence": 0.998 + }, + { + "text": "the", + "start": 41.82, + "end": 41.86, + "confidence": 0.981 + }, + { + "text": "one", + "start": 41.86, + "end": 41.9, + "confidence": 0.99 + }, + { + "text": "who", + "start": 41.9, + "end": 41.94, + "confidence": 0.99 + }, + { + "text": "is", + "start": 41.94, + "end": 41.98, + "confidence": 0.998 + }, + { + "text": "the", + "start": 41.98, + "end": 42.02, + "confidence": 0.984 + }, + { + "text": "one", + "start": 42.02, + "end": 42.06, + "confidence": 0.991 + }, + { + "text": "who", + "start": 42.06, + "end": 42.1, + "confidence": 0.99 + }, + { + "text": "is", + "start": 42.1, + "end": 42.14, + "confidence": 0.998 + }, + { + "text": "the", + "start": 42.14, + "end": 42.18, + "confidence": 0.987 + }, + { + "text": "one", + "start": 42.18, + "end": 42.22, + "confidence": 0.991 + }, + { + "text": "who", + "start": 42.22, + "end": 42.26, + "confidence": 0.99 + }, + { + "text": "is", + "start": 42.26, + "end": 42.3, + "confidence": 0.998 + }, + { + "text": "the", + "start": 42.3, + "end": 42.34, + "confidence": 0.988 + }, + { + "text": "one", + "start": 42.34, + "end": 42.38, + "confidence": 0.991 + }, + { + "text": "who", + "start": 42.38, + "end": 42.42, + "confidence": 0.989 + }, + { + "text": "is", + "start": 42.42, + "end": 42.46, + "confidence": 0.999 + }, + { + "text": "the", + "start": 42.46, + "end": 42.5, + "confidence": 0.989 + }, + { + "text": "one", + "start": 42.5, + "end": 42.54, + "confidence": 0.991 + }, + { + "text": "who", + "start": 42.54, + "end": 42.58, + "confidence": 0.989 + }, + { + "text": "is", + "start": 42.58, + "end": 42.62, + "confidence": 0.999 + }, + { + "text": "the", + "start": 42.62, + "end": 42.66, + "confidence": 0.99 + }, + { + "text": "one", + "start": 42.66, + "end": 42.7, + "confidence": 0.991 + }, + { + 
"text": "who", + "start": 42.7, + "end": 42.74, + "confidence": 0.989 + }, + { + "text": "is", + "start": 42.74, + "end": 42.78, + "confidence": 0.999 + }, + { + "text": "the", + "start": 42.78, + "end": 42.82, + "confidence": 0.99 + }, + { + "text": "one", + "start": 42.82, + "end": 42.86, + "confidence": 0.992 + }, + { + "text": "who", + "start": 42.86, + "end": 42.9, + "confidence": 0.988 + }, + { + "text": "is", + "start": 42.9, + "end": 42.94, + "confidence": 0.999 + }, + { + "text": "the", + "start": 42.94, + "end": 42.98, + "confidence": 0.991 + }, + { + "text": "one", + "start": 42.98, + "end": 43.02, + "confidence": 0.991 + }, + { + "text": "who", + "start": 43.02, + "end": 43.06, + "confidence": 0.988 + }, + { + "text": "is", + "start": 43.06, + "end": 43.1, + "confidence": 0.999 + }, + { + "text": "the", + "start": 43.1, + "end": 43.14, + "confidence": 0.991 + }, + { + "text": "one", + "start": 43.14, + "end": 43.18, + "confidence": 0.991 + }, + { + "text": "who", + "start": 43.18, + "end": 43.22, + "confidence": 0.988 + }, + { + "text": "is", + "start": 43.22, + "end": 43.26, + "confidence": 0.999 + }, + { + "text": "the", + "start": 43.26, + "end": 43.3, + "confidence": 0.991 + }, + { + "text": "one", + "start": 43.3, + "end": 43.34, + "confidence": 0.991 + }, + { + "text": "who", + "start": 43.34, + "end": 43.38, + "confidence": 0.988 + }, + { + "text": "is", + "start": 43.38, + "end": 43.42, + "confidence": 0.999 + }, + { + "text": "the", + "start": 43.42, + "end": 43.46, + "confidence": 0.991 + }, + { + "text": "one", + "start": 43.46, + "end": 43.5, + "confidence": 0.991 + }, + { + "text": "who", + "start": 43.5, + "end": 43.54, + "confidence": 0.987 + }, + { + "text": "is", + "start": 43.54, + "end": 43.58, + "confidence": 0.999 + }, + { + "text": "the", + "start": 43.58, + "end": 43.62, + "confidence": 0.991 + }, + { + "text": "one", + "start": 43.62, + "end": 43.66, + "confidence": 0.991 + }, + { + "text": "who", + "start": 43.66, + "end": 43.7, 
+ "confidence": 0.987 + }, + { + "text": "is", + "start": 43.7, + "end": 43.74, + "confidence": 0.999 + }, + { + "text": "the", + "start": 43.74, + "end": 43.78, + "confidence": 0.991 + }, + { + "text": "one", + "start": 43.78, + "end": 43.82, + "confidence": 0.991 + }, + { + "text": "who", + "start": 43.82, + "end": 43.86, + "confidence": 0.987 + }, + { + "text": "is", + "start": 43.86, + "end": 43.9, + "confidence": 0.999 + }, + { + "text": "the", + "start": 43.9, + "end": 43.94, + "confidence": 0.991 + }, + { + "text": "one", + "start": 43.94, + "end": 43.98, + "confidence": 0.99 + }, + { + "text": "who", + "start": 43.98, + "end": 44.02, + "confidence": 0.986 + }, + { + "text": "is", + "start": 44.02, + "end": 44.06, + "confidence": 0.999 + }, + { + "text": "the", + "start": 44.06, + "end": 44.1, + "confidence": 0.991 + }, + { + "text": "one", + "start": 44.1, + "end": 44.14, + "confidence": 0.99 + }, + { + "text": "who", + "start": 44.14, + "end": 44.18, + "confidence": 0.986 + }, + { + "text": "is", + "start": 44.18, + "end": 44.22, + "confidence": 0.999 + }, + { + "text": "the", + "start": 44.22, + "end": 44.26, + "confidence": 0.991 + }, + { + "text": "one", + "start": 44.26, + "end": 44.3, + "confidence": 0.99 + }, + { + "text": "who", + "start": 44.3, + "end": 44.34, + "confidence": 0.985 + }, + { + "text": "is", + "start": 44.34, + "end": 44.38, + "confidence": 0.999 + }, + { + "text": "the", + "start": 44.38, + "end": 44.42, + "confidence": 0.991 + }, + { + "text": "one", + "start": 44.42, + "end": 44.46, + "confidence": 0.99 + }, + { + "text": "who", + "start": 44.46, + "end": 44.5, + "confidence": 0.985 + }, + { + "text": "is", + "start": 44.5, + "end": 44.54, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.54, + "end": 44.58, + "confidence": 0.991 + }, + { + "text": "one", + "start": 44.58, + "end": 44.62, + "confidence": 0.989 + }, + { + "text": "who", + "start": 44.62, + "end": 44.66, + "confidence": 0.984 + }, + { + "text": "is", + 
"start": 44.66, + "end": 44.7, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.7, + "end": 44.74, + "confidence": 0.991 + }, + { + "text": "one", + "start": 44.74, + "end": 44.78, + "confidence": 0.989 + }, + { + "text": "who", + "start": 44.78, + "end": 44.82, + "confidence": 0.983 + }, + { + "text": "is", + "start": 44.82, + "end": 44.86, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.86, + "end": 44.9, + "confidence": 0.991 + }, + { + "text": "one", + "start": 44.9, + "end": 44.94, + "confidence": 0.989 + }, + { + "text": "who", + "start": 44.94, + "end": 44.98, + "confidence": 0.983 + }, + { + "text": "is", + "start": 44.98, + "end": 45.02, + "confidence": 0.998 + }, + { + "text": "the", + "start": 45.02, + "end": 45.06, + "confidence": 0.991 + }, + { + "text": "one", + "start": 45.06, + "end": 45.1, + "confidence": 0.988 + }, + { + "text": "who", + "start": 45.1, + "end": 45.14, + "confidence": 0.982 + }, + { + "text": "is", + "start": 45.14, + "end": 45.18, + "confidence": 0.998 + }, + { + "text": "the", + "start": 45.18, + "end": 45.22, + "confidence": 0.99 + }, + { + "text": "one", + "start": 45.22, + "end": 45.26, + "confidence": 0.988 + }, + { + "text": "who", + "start": 45.26, + "end": 45.3, + "confidence": 0.98 + }, + { + "text": "is", + "start": 45.3, + "end": 45.34, + "confidence": 0.998 + }, + { + "text": "the", + "start": 45.34, + "end": 45.38, + "confidence": 0.99 + }, + { + "text": "one", + "start": 45.38, + "end": 45.42, + "confidence": 0.987 + }, + { + "text": "who", + "start": 45.42, + "end": 45.46, + "confidence": 0.979 + }, + { + "text": "is", + "start": 45.46, + "end": 45.5, + "confidence": 0.998 + }, + { + "text": "the", + "start": 45.5, + "end": 45.54, + "confidence": 0.99 + }, + { + "text": "one", + "start": 45.54, + "end": 45.58, + "confidence": 0.987 + }, + { + "text": "who", + "start": 45.58, + "end": 45.62, + "confidence": 0.978 + }, + { + "text": "is", + "start": 45.62, + "end": 45.66, + "confidence": 
0.997 + }, + { + "text": "the", + "start": 45.66, + "end": 45.7, + "confidence": 0.99 + }, + { + "text": "one", + "start": 45.7, + "end": 45.74, + "confidence": 0.986 + }, + { + "text": "who", + "start": 45.74, + "end": 45.78, + "confidence": 0.976 + }, + { + "text": "is", + "start": 45.78, + "end": 45.82, + "confidence": 0.997 + }, + { + "text": "the", + "start": 45.82, + "end": 45.86, + "confidence": 0.989 + }, + { + "text": "one", + "start": 45.86, + "end": 45.9, + "confidence": 0.986 + }, + { + "text": "who", + "start": 45.9, + "end": 45.94, + "confidence": 0.976 + }, + { + "text": "is", + "start": 45.94, + "end": 45.98, + "confidence": 0.997 + }, + { + "text": "the", + "start": 45.98, + "end": 46.02, + "confidence": 0.989 + }, + { + "text": "one", + "start": 46.02, + "end": 46.06, + "confidence": 0.986 + }, + { + "text": "who", + "start": 46.06, + "end": 46.1, + "confidence": 0.974 + }, + { + "text": "is", + "start": 46.1, + "end": 46.14, + "confidence": 0.997 + }, + { + "text": "the", + "start": 46.14, + "end": 46.18, + "confidence": 0.989 + }, + { + "text": "one", + "start": 46.18, + "end": 46.22, + "confidence": 0.985 + }, + { + "text": "who", + "start": 46.22, + "end": 46.26, + "confidence": 0.972 + }, + { + "text": "is", + "start": 46.26, + "end": 46.3, + "confidence": 0.996 + }, + { + "text": "the", + "start": 46.3, + "end": 46.34, + "confidence": 0.988 + }, + { + "text": "one", + "start": 46.34, + "end": 46.38, + "confidence": 0.984 + }, + { + "text": "who", + "start": 46.38, + "end": 46.42, + "confidence": 0.971 + }, + { + "text": "is", + "start": 46.42, + "end": 46.46, + "confidence": 0.996 + }, + { + "text": "the", + "start": 46.46, + "end": 46.5, + "confidence": 0.988 + }, + { + "text": "one", + "start": 46.5, + "end": 46.54, + "confidence": 0.984 + }, + { + "text": "who", + "start": 46.54, + "end": 46.58, + "confidence": 0.97 + }, + { + "text": "is", + "start": 46.58, + "end": 46.62, + "confidence": 0.996 + }, + { + "text": "the", + "start": 46.62, 
+ "end": 46.66, + "confidence": 0.987 + }, + { + "text": "one", + "start": 46.66, + "end": 46.7, + "confidence": 0.984 + }, + { + "text": "who", + "start": 46.7, + "end": 46.74, + "confidence": 0.968 + }, + { + "text": "is", + "start": 46.74, + "end": 46.78, + "confidence": 0.995 + }, + { + "text": "the", + "start": 46.78, + "end": 46.82, + "confidence": 0.987 + }, + { + "text": "one", + "start": 46.82, + "end": 46.86, + "confidence": 0.983 + }, + { + "text": "who", + "start": 46.86, + "end": 46.9, + "confidence": 0.966 + }, + { + "text": "is", + "start": 46.9, + "end": 46.94, + "confidence": 0.995 + }, + { + "text": "the", + "start": 46.94, + "end": 46.98, + "confidence": 0.986 + }, + { + "text": "one", + "start": 46.98, + "end": 47.02, + "confidence": 0.982 + }, + { + "text": "who", + "start": 47.02, + "end": 47.06, + "confidence": 0.964 + }, + { + "text": "is", + "start": 47.06, + "end": 47.1, + "confidence": 0.995 + }, + { + "text": "the", + "start": 47.1, + "end": 47.14, + "confidence": 0.986 + }, + { + "text": "one", + "start": 47.14, + "end": 47.18, + "confidence": 0.982 + }, + { + "text": "who", + "start": 47.18, + "end": 47.22, + "confidence": 0.963 + }, + { + "text": "is", + "start": 47.22, + "end": 47.26, + "confidence": 0.994 + }, + { + "text": "the", + "start": 47.26, + "end": 47.3, + "confidence": 0.985 + }, + { + "text": "one", + "start": 47.3, + "end": 47.34, + "confidence": 0.981 + }, + { + "text": "who", + "start": 47.34, + "end": 47.38, + "confidence": 0.959 + }, + { + "text": "is", + "start": 47.38, + "end": 47.42, + "confidence": 0.993 + }, + { + "text": "the", + "start": 47.42, + "end": 47.46, + "confidence": 0.984 + }, + { + "text": "one", + "start": 47.46, + "end": 47.5, + "confidence": 0.98 + }, + { + "text": "who", + "start": 47.5, + "end": 47.54, + "confidence": 0.958 + }, + { + "text": "is", + "start": 47.54, + "end": 47.58, + "confidence": 0.993 + }, + { + "text": "the", + "start": 47.58, + "end": 47.62, + "confidence": 0.983 + }, + { + 
"text": "one", + "start": 47.62, + "end": 47.66, + "confidence": 0.979 + }, + { + "text": "who", + "start": 47.66, + "end": 47.7, + "confidence": 0.955 + }, + { + "text": "is", + "start": 47.7, + "end": 47.74, + "confidence": 0.993 + }, + { + "text": "the", + "start": 47.74, + "end": 47.78, + "confidence": 0.982 + }, + { + "text": "one", + "start": 47.78, + "end": 47.82, + "confidence": 0.979 + }, + { + "text": "who", + "start": 47.82, + "end": 47.86, + "confidence": 0.953 + }, + { + "text": "is", + "start": 47.86, + "end": 47.9, + "confidence": 0.992 + }, + { + "text": "the", + "start": 47.9, + "end": 47.94, + "confidence": 0.982 + }, + { + "text": "one", + "start": 47.94, + "end": 47.98, + "confidence": 0.978 + }, + { + "text": "who", + "start": 47.98, + "end": 48.02, + "confidence": 0.952 + }, + { + "text": "is", + "start": 48.02, + "end": 48.06, + "confidence": 0.992 + }, + { + "text": "the", + "start": 48.06, + "end": 48.1, + "confidence": 0.981 + }, + { + "text": "one", + "start": 48.1, + "end": 48.14, + "confidence": 0.976 + }, + { + "text": "who", + "start": 48.14, + "end": 48.18, + "confidence": 0.95 + }, + { + "text": "is", + "start": 48.18, + "end": 48.22, + "confidence": 0.991 + }, + { + "text": "the", + "start": 48.22, + "end": 48.26, + "confidence": 0.98 + }, + { + "text": "one", + "start": 48.26, + "end": 48.3, + "confidence": 0.976 + }, + { + "text": "who", + "start": 48.3, + "end": 48.34, + "confidence": 0.949 + }, + { + "text": "is", + "start": 48.34, + "end": 48.38, + "confidence": 0.991 + }, + { + "text": "the", + "start": 48.38, + "end": 48.42, + "confidence": 0.979 + }, + { + "text": "one", + "start": 48.42, + "end": 48.46, + "confidence": 0.976 + }, + { + "text": "who", + "start": 48.46, + "end": 48.5, + "confidence": 0.944 + }, + { + "text": "is", + "start": 48.5, + "end": 48.54, + "confidence": 0.99 + }, + { + "text": "the", + "start": 48.54, + "end": 48.58, + "confidence": 0.979 + }, + { + "text": "one", + "start": 48.58, + "end": 48.62, + 
"confidence": 0.975 + }, + { + "text": "who", + "start": 48.62, + "end": 48.66, + "confidence": 0.945 + }, + { + "text": "is", + "start": 48.66, + "end": 67.0, + "confidence": 0.99 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/small.en/arabic.mp3.words.json b/tests/expected/small.en/arabic.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..190e702c32876986132ac46515c9177cad2b5b22 --- /dev/null +++ b/tests/expected/small.en/arabic.mp3.words.json @@ -0,0 +1,3348 @@ +{ + "text": " I am the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the 
one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 2.92, + "end": 7.72, + "text": " I am the one who is the one who is the one who is the one who is the one who is the one", + "tokens": [ + 50363, + 314, + 716, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 50713 + ], + "temperature": 0.0, + "avg_logprob": -0.2332169426812066, + "compression_ratio": 24.294117647058822, + "no_speech_prob": 0.6509259939193726, + "confidence": 0.358, + "words": [ + { + "text": "I", + "start": 2.92, + "end": 3.16, + "confidence": 0.053 + }, + { + "text": "am", + "start": 3.16, + "end": 4.04, + "confidence": 0.152 + }, + { + "text": "the", + "start": 4.04, + "end": 5.44, + "confidence": 0.144 + }, + { + "text": "one", + "start": 5.44, + "end": 6.1, + "confidence": 0.086 + }, + { + "text": "who", + "start": 6.1, + "end": 6.18, + "confidence": 0.718 + }, + { + "text": "is", + "start": 6.18, + "end": 6.22, + "confidence": 0.119 + }, + { + "text": "the", + "start": 6.22, + "end": 6.24, + "confidence": 0.134 + }, + { + "text": "one", + "start": 6.24, + "end": 6.72, + "confidence": 0.203 + }, + { + "text": "who", + "start": 6.72, + "end": 6.74, + "confidence": 0.618 + }, + { + "text": "is", + "start": 6.74, + "end": 7.18, + "confidence": 0.319 + }, + { + "text": "the", + "start": 7.18, + "end": 7.2, + "confidence": 0.38 + }, + { + "text": "one", + "start": 7.2, + "end": 7.48, + "confidence": 0.443 + }, + { + "text": "who", + "start": 7.48, + "end": 7.5, + "confidence": 0.447 + }, + { + "text": "is", + "start": 7.5, + "end": 7.52, + "confidence": 0.518 + }, + { 
+ "text": "the", + "start": 7.52, + "end": 7.54, + "confidence": 0.542 + }, + { + "text": "one", + "start": 7.54, + "end": 7.56, + "confidence": 0.724 + }, + { + "text": "who", + "start": 7.56, + "end": 7.58, + "confidence": 0.433 + }, + { + "text": "is", + "start": 7.58, + "end": 7.6, + "confidence": 0.677 + }, + { + "text": "the", + "start": 7.6, + "end": 7.62, + "confidence": 0.638 + }, + { + "text": "one", + "start": 7.62, + "end": 7.64, + "confidence": 0.817 + }, + { + "text": "who", + "start": 7.64, + "end": 7.66, + "confidence": 0.504 + }, + { + "text": "is", + "start": 7.66, + "end": 7.68, + "confidence": 0.74 + }, + { + "text": "the", + "start": 7.68, + "end": 7.7, + "confidence": 0.696 + }, + { + "text": "one", + "start": 7.7, + "end": 7.72, + "confidence": 0.697 + } + ] + }, + { + "id": 1, + "seek": 700, + "start": 7.72, + "end": 37.18, + "text": " who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the", + "tokens": [ + 50363, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, 
+ 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262 + ], + "temperature": 0.0, + "avg_logprob": -0.07849001566569011, + "compression_ratio": 26.93548387096774, + "no_speech_prob": 0.6889318823814392, + "confidence": 0.925, + "words": [ + { + "text": "who", + "start": 7.72, + "end": 7.74, + "confidence": 0.214 + }, + { + "text": "is", + "start": 7.74, + "end": 7.76, + "confidence": 0.892 + }, + { + "text": "the", + "start": 7.76, + "end": 7.78, + "confidence": 0.918 + }, + { + "text": "one", + "start": 7.78, + "end": 9.96, + "confidence": 0.955 + }, + { + "text": "who", + "start": 9.96, + "end": 13.46, + "confidence": 0.905 + }, + { + "text": "is", + "start": 13.46, + "end": 14.0, + "confidence": 0.908 + }, + { + "text": "the", + "start": 14.0, + 
"end": 14.38, + "confidence": 0.942 + }, + { + "text": "one", + "start": 14.38, + "end": 14.4, + "confidence": 0.977 + }, + { + "text": "who", + "start": 14.4, + "end": 14.42, + "confidence": 0.759 + }, + { + "text": "is", + "start": 14.42, + "end": 14.44, + "confidence": 0.932 + }, + { + "text": "the", + "start": 14.44, + "end": 15.24, + "confidence": 0.957 + }, + { + "text": "one", + "start": 15.24, + "end": 18.0, + "confidence": 0.982 + }, + { + "text": "who", + "start": 18.0, + "end": 18.02, + "confidence": 0.582 + }, + { + "text": "is", + "start": 18.02, + "end": 18.04, + "confidence": 0.944 + }, + { + "text": "the", + "start": 18.04, + "end": 18.06, + "confidence": 0.953 + }, + { + "text": "one", + "start": 18.06, + "end": 18.08, + "confidence": 0.98 + }, + { + "text": "who", + "start": 18.08, + "end": 19.38, + "confidence": 0.578 + }, + { + "text": "is", + "start": 19.38, + "end": 19.9, + "confidence": 0.953 + }, + { + "text": "the", + "start": 19.9, + "end": 19.92, + "confidence": 0.95 + }, + { + "text": "one", + "start": 19.92, + "end": 19.94, + "confidence": 0.98 + }, + { + "text": "who", + "start": 19.94, + "end": 19.96, + "confidence": 0.592 + }, + { + "text": "is", + "start": 19.96, + "end": 20.88, + "confidence": 0.95 + }, + { + "text": "the", + "start": 20.88, + "end": 21.28, + "confidence": 0.872 + }, + { + "text": "one", + "start": 21.28, + "end": 21.52, + "confidence": 0.902 + }, + { + "text": "who", + "start": 21.52, + "end": 21.54, + "confidence": 0.5 + }, + { + "text": "is", + "start": 21.54, + "end": 22.04, + "confidence": 0.943 + }, + { + "text": "the", + "start": 22.04, + "end": 22.24, + "confidence": 0.898 + }, + { + "text": "one", + "start": 22.24, + "end": 25.3, + "confidence": 0.98 + }, + { + "text": "who", + "start": 25.3, + "end": 25.32, + "confidence": 0.542 + }, + { + "text": "is", + "start": 25.32, + "end": 26.18, + "confidence": 0.953 + }, + { + "text": "the", + "start": 26.18, + "end": 26.64, + "confidence": 0.904 + }, + { + 
"text": "one", + "start": 26.64, + "end": 26.92, + "confidence": 0.976 + }, + { + "text": "who", + "start": 26.92, + "end": 26.94, + "confidence": 0.587 + }, + { + "text": "is", + "start": 26.94, + "end": 27.42, + "confidence": 0.953 + }, + { + "text": "the", + "start": 27.42, + "end": 28.08, + "confidence": 0.903 + }, + { + "text": "one", + "start": 28.08, + "end": 28.1, + "confidence": 0.968 + }, + { + "text": "who", + "start": 28.1, + "end": 28.12, + "confidence": 0.604 + }, + { + "text": "is", + "start": 28.12, + "end": 28.14, + "confidence": 0.956 + }, + { + "text": "the", + "start": 28.14, + "end": 28.16, + "confidence": 0.91 + }, + { + "text": "one", + "start": 28.16, + "end": 28.46, + "confidence": 0.963 + }, + { + "text": "who", + "start": 28.46, + "end": 28.48, + "confidence": 0.623 + }, + { + "text": "is", + "start": 28.48, + "end": 28.5, + "confidence": 0.96 + }, + { + "text": "the", + "start": 28.5, + "end": 28.52, + "confidence": 0.92 + }, + { + "text": "one", + "start": 28.52, + "end": 30.08, + "confidence": 0.961 + }, + { + "text": "who", + "start": 30.08, + "end": 30.1, + "confidence": 0.65 + }, + { + "text": "is", + "start": 30.1, + "end": 30.12, + "confidence": 0.965 + }, + { + "text": "the", + "start": 30.12, + "end": 30.3, + "confidence": 0.93 + }, + { + "text": "one", + "start": 30.3, + "end": 30.32, + "confidence": 0.961 + }, + { + "text": "who", + "start": 30.32, + "end": 31.0, + "confidence": 0.672 + }, + { + "text": "is", + "start": 31.0, + "end": 31.52, + "confidence": 0.971 + }, + { + "text": "the", + "start": 31.52, + "end": 31.54, + "confidence": 0.94 + }, + { + "text": "one", + "start": 31.54, + "end": 32.26, + "confidence": 0.962 + }, + { + "text": "who", + "start": 32.26, + "end": 32.48, + "confidence": 0.704 + }, + { + "text": "is", + "start": 32.48, + "end": 33.26, + "confidence": 0.976 + }, + { + "text": "the", + "start": 33.26, + "end": 33.28, + "confidence": 0.946 + }, + { + "text": "one", + "start": 33.28, + "end": 33.56, + 
"confidence": 0.964 + }, + { + "text": "who", + "start": 33.56, + "end": 33.86, + "confidence": 0.723 + }, + { + "text": "is", + "start": 33.86, + "end": 33.88, + "confidence": 0.979 + }, + { + "text": "the", + "start": 33.88, + "end": 33.9, + "confidence": 0.951 + }, + { + "text": "one", + "start": 33.9, + "end": 33.92, + "confidence": 0.966 + }, + { + "text": "who", + "start": 33.92, + "end": 33.94, + "confidence": 0.747 + }, + { + "text": "is", + "start": 33.94, + "end": 33.96, + "confidence": 0.982 + }, + { + "text": "the", + "start": 33.96, + "end": 33.98, + "confidence": 0.956 + }, + { + "text": "one", + "start": 33.98, + "end": 34.0, + "confidence": 0.967 + }, + { + "text": "who", + "start": 34.0, + "end": 34.02, + "confidence": 0.757 + }, + { + "text": "is", + "start": 34.02, + "end": 34.04, + "confidence": 0.984 + }, + { + "text": "the", + "start": 34.04, + "end": 34.06, + "confidence": 0.961 + }, + { + "text": "one", + "start": 34.06, + "end": 34.08, + "confidence": 0.969 + }, + { + "text": "who", + "start": 34.08, + "end": 34.1, + "confidence": 0.776 + }, + { + "text": "is", + "start": 34.1, + "end": 34.12, + "confidence": 0.986 + }, + { + "text": "the", + "start": 34.12, + "end": 34.14, + "confidence": 0.965 + }, + { + "text": "one", + "start": 34.14, + "end": 34.16, + "confidence": 0.97 + }, + { + "text": "who", + "start": 34.16, + "end": 34.18, + "confidence": 0.8 + }, + { + "text": "is", + "start": 34.18, + "end": 34.2, + "confidence": 0.987 + }, + { + "text": "the", + "start": 34.2, + "end": 34.22, + "confidence": 0.968 + }, + { + "text": "one", + "start": 34.22, + "end": 34.24, + "confidence": 0.971 + }, + { + "text": "who", + "start": 34.24, + "end": 34.26, + "confidence": 0.82 + }, + { + "text": "is", + "start": 34.26, + "end": 34.28, + "confidence": 0.987 + }, + { + "text": "the", + "start": 34.28, + "end": 34.3, + "confidence": 0.969 + }, + { + "text": "one", + "start": 34.3, + "end": 34.32, + "confidence": 0.972 + }, + { + "text": "who", + 
"start": 34.32, + "end": 34.34, + "confidence": 0.836 + }, + { + "text": "is", + "start": 34.34, + "end": 34.36, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.36, + "end": 34.38, + "confidence": 0.971 + }, + { + "text": "one", + "start": 34.38, + "end": 34.4, + "confidence": 0.972 + }, + { + "text": "who", + "start": 34.4, + "end": 34.42, + "confidence": 0.872 + }, + { + "text": "is", + "start": 34.42, + "end": 34.44, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.44, + "end": 34.46, + "confidence": 0.972 + }, + { + "text": "one", + "start": 34.46, + "end": 34.48, + "confidence": 0.973 + }, + { + "text": "who", + "start": 34.48, + "end": 34.5, + "confidence": 0.889 + }, + { + "text": "is", + "start": 34.5, + "end": 34.52, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.52, + "end": 34.54, + "confidence": 0.973 + }, + { + "text": "one", + "start": 34.54, + "end": 34.56, + "confidence": 0.973 + }, + { + "text": "who", + "start": 34.56, + "end": 34.58, + "confidence": 0.899 + }, + { + "text": "is", + "start": 34.58, + "end": 34.6, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.6, + "end": 34.62, + "confidence": 0.973 + }, + { + "text": "one", + "start": 34.62, + "end": 34.64, + "confidence": 0.973 + }, + { + "text": "who", + "start": 34.64, + "end": 34.66, + "confidence": 0.912 + }, + { + "text": "is", + "start": 34.66, + "end": 34.68, + "confidence": 0.989 + }, + { + "text": "the", + "start": 34.68, + "end": 34.7, + "confidence": 0.973 + }, + { + "text": "one", + "start": 34.7, + "end": 34.72, + "confidence": 0.973 + }, + { + "text": "who", + "start": 34.72, + "end": 34.74, + "confidence": 0.921 + }, + { + "text": "is", + "start": 34.74, + "end": 34.76, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.76, + "end": 34.78, + "confidence": 0.974 + }, + { + "text": "one", + "start": 34.78, + "end": 34.8, + "confidence": 0.974 + }, + { + "text": "who", + "start": 34.8, + "end": 34.82, + "confidence": 
0.927 + }, + { + "text": "is", + "start": 34.82, + "end": 34.84, + "confidence": 0.989 + }, + { + "text": "the", + "start": 34.84, + "end": 34.86, + "confidence": 0.974 + }, + { + "text": "one", + "start": 34.86, + "end": 34.88, + "confidence": 0.974 + }, + { + "text": "who", + "start": 34.88, + "end": 34.9, + "confidence": 0.935 + }, + { + "text": "is", + "start": 34.9, + "end": 34.92, + "confidence": 0.988 + }, + { + "text": "the", + "start": 34.92, + "end": 34.94, + "confidence": 0.974 + }, + { + "text": "one", + "start": 34.94, + "end": 34.96, + "confidence": 0.974 + }, + { + "text": "who", + "start": 34.96, + "end": 34.98, + "confidence": 0.934 + }, + { + "text": "is", + "start": 34.98, + "end": 35.0, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.0, + "end": 35.02, + "confidence": 0.975 + }, + { + "text": "one", + "start": 35.02, + "end": 35.04, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.04, + "end": 35.06, + "confidence": 0.937 + }, + { + "text": "is", + "start": 35.06, + "end": 35.08, + "confidence": 0.989 + }, + { + "text": "the", + "start": 35.08, + "end": 35.1, + "confidence": 0.976 + }, + { + "text": "one", + "start": 35.1, + "end": 35.12, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.12, + "end": 35.14, + "confidence": 0.937 + }, + { + "text": "is", + "start": 35.14, + "end": 35.16, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.16, + "end": 35.18, + "confidence": 0.976 + }, + { + "text": "one", + "start": 35.18, + "end": 35.2, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.2, + "end": 35.22, + "confidence": 0.934 + }, + { + "text": "is", + "start": 35.22, + "end": 35.24, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.24, + "end": 35.26, + "confidence": 0.976 + }, + { + "text": "one", + "start": 35.26, + "end": 35.28, + "confidence": 0.975 + }, + { + "text": "who", + "start": 35.28, + "end": 35.3, + "confidence": 0.933 + }, + { + "text": "is", + "start": 
35.3, + "end": 35.32, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.32, + "end": 35.34, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.34, + "end": 35.36, + "confidence": 0.975 + }, + { + "text": "who", + "start": 35.36, + "end": 35.38, + "confidence": 0.93 + }, + { + "text": "is", + "start": 35.38, + "end": 35.4, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.4, + "end": 35.42, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.42, + "end": 35.44, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.44, + "end": 35.46, + "confidence": 0.928 + }, + { + "text": "is", + "start": 35.46, + "end": 35.48, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.48, + "end": 35.5, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.5, + "end": 35.52, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.52, + "end": 35.54, + "confidence": 0.926 + }, + { + "text": "is", + "start": 35.54, + "end": 35.56, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.56, + "end": 35.58, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.58, + "end": 35.6, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.6, + "end": 35.62, + "confidence": 0.928 + }, + { + "text": "is", + "start": 35.62, + "end": 35.64, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.64, + "end": 35.66, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.66, + "end": 35.68, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.68, + "end": 35.7, + "confidence": 0.926 + }, + { + "text": "is", + "start": 35.7, + "end": 35.72, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.72, + "end": 35.74, + "confidence": 0.978 + }, + { + "text": "one", + "start": 35.74, + "end": 35.76, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.76, + "end": 35.78, + "confidence": 0.928 + }, + { + "text": "is", + "start": 35.78, + "end": 35.8, + "confidence": 0.988 + 
}, + { + "text": "the", + "start": 35.8, + "end": 35.82, + "confidence": 0.978 + }, + { + "text": "one", + "start": 35.82, + "end": 35.84, + "confidence": 0.973 + }, + { + "text": "who", + "start": 35.84, + "end": 35.86, + "confidence": 0.926 + }, + { + "text": "is", + "start": 35.86, + "end": 35.88, + "confidence": 0.988 + }, + { + "text": "the", + "start": 35.88, + "end": 35.9, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.9, + "end": 35.92, + "confidence": 0.974 + }, + { + "text": "who", + "start": 35.92, + "end": 35.94, + "confidence": 0.928 + }, + { + "text": "is", + "start": 35.94, + "end": 35.96, + "confidence": 0.987 + }, + { + "text": "the", + "start": 35.96, + "end": 35.98, + "confidence": 0.977 + }, + { + "text": "one", + "start": 35.98, + "end": 36.0, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.0, + "end": 36.02, + "confidence": 0.925 + }, + { + "text": "is", + "start": 36.02, + "end": 36.04, + "confidence": 0.987 + }, + { + "text": "the", + "start": 36.04, + "end": 36.06, + "confidence": 0.977 + }, + { + "text": "one", + "start": 36.06, + "end": 36.08, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.08, + "end": 36.1, + "confidence": 0.925 + }, + { + "text": "is", + "start": 36.1, + "end": 36.12, + "confidence": 0.987 + }, + { + "text": "the", + "start": 36.12, + "end": 36.14, + "confidence": 0.977 + }, + { + "text": "one", + "start": 36.14, + "end": 36.16, + "confidence": 0.974 + }, + { + "text": "who", + "start": 36.16, + "end": 36.18, + "confidence": 0.927 + }, + { + "text": "is", + "start": 36.18, + "end": 36.2, + "confidence": 0.987 + }, + { + "text": "the", + "start": 36.2, + "end": 36.22, + "confidence": 0.977 + }, + { + "text": "one", + "start": 36.22, + "end": 36.24, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.24, + "end": 36.26, + "confidence": 0.923 + }, + { + "text": "is", + "start": 36.26, + "end": 36.28, + "confidence": 0.987 + }, + { + "text": "the", + "start": 36.28, + 
"end": 36.3, + "confidence": 0.977 + }, + { + "text": "one", + "start": 36.3, + "end": 36.32, + "confidence": 0.972 + }, + { + "text": "who", + "start": 36.32, + "end": 36.34, + "confidence": 0.924 + }, + { + "text": "is", + "start": 36.34, + "end": 36.36, + "confidence": 0.986 + }, + { + "text": "the", + "start": 36.36, + "end": 36.38, + "confidence": 0.976 + }, + { + "text": "one", + "start": 36.38, + "end": 36.4, + "confidence": 0.972 + }, + { + "text": "who", + "start": 36.4, + "end": 36.42, + "confidence": 0.922 + }, + { + "text": "is", + "start": 36.42, + "end": 36.44, + "confidence": 0.985 + }, + { + "text": "the", + "start": 36.44, + "end": 36.46, + "confidence": 0.976 + }, + { + "text": "one", + "start": 36.46, + "end": 36.48, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.48, + "end": 36.5, + "confidence": 0.924 + }, + { + "text": "is", + "start": 36.5, + "end": 36.52, + "confidence": 0.985 + }, + { + "text": "the", + "start": 36.52, + "end": 36.54, + "confidence": 0.975 + }, + { + "text": "one", + "start": 36.54, + "end": 36.56, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.56, + "end": 36.58, + "confidence": 0.92 + }, + { + "text": "is", + "start": 36.58, + "end": 36.6, + "confidence": 0.983 + }, + { + "text": "the", + "start": 36.6, + "end": 36.62, + "confidence": 0.975 + }, + { + "text": "one", + "start": 36.62, + "end": 36.64, + "confidence": 0.971 + }, + { + "text": "who", + "start": 36.64, + "end": 36.66, + "confidence": 0.921 + }, + { + "text": "is", + "start": 36.66, + "end": 36.68, + "confidence": 0.983 + }, + { + "text": "the", + "start": 36.68, + "end": 36.7, + "confidence": 0.974 + }, + { + "text": "one", + "start": 36.7, + "end": 36.72, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.72, + "end": 36.74, + "confidence": 0.918 + }, + { + "text": "is", + "start": 36.74, + "end": 36.76, + "confidence": 0.982 + }, + { + "text": "the", + "start": 36.76, + "end": 36.78, + "confidence": 0.974 + }, + { + 
"text": "one", + "start": 36.78, + "end": 36.8, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.8, + "end": 36.82, + "confidence": 0.919 + }, + { + "text": "is", + "start": 36.82, + "end": 36.84, + "confidence": 0.982 + }, + { + "text": "the", + "start": 36.84, + "end": 36.86, + "confidence": 0.973 + }, + { + "text": "one", + "start": 36.86, + "end": 36.88, + "confidence": 0.973 + }, + { + "text": "who", + "start": 36.88, + "end": 36.9, + "confidence": 0.917 + }, + { + "text": "is", + "start": 36.9, + "end": 36.92, + "confidence": 0.981 + }, + { + "text": "the", + "start": 36.92, + "end": 36.94, + "confidence": 0.973 + }, + { + "text": "one", + "start": 36.94, + "end": 36.96, + "confidence": 0.972 + }, + { + "text": "who", + "start": 36.96, + "end": 36.98, + "confidence": 0.919 + }, + { + "text": "is", + "start": 36.98, + "end": 37.0, + "confidence": 0.98 + }, + { + "text": "the", + "start": 37.0, + "end": 37.02, + "confidence": 0.972 + }, + { + "text": "one", + "start": 37.02, + "end": 37.04, + "confidence": 0.972 + }, + { + "text": "who", + "start": 37.04, + "end": 37.06, + "confidence": 0.918 + }, + { + "text": "is", + "start": 37.06, + "end": 37.08, + "confidence": 0.979 + }, + { + "text": "the", + "start": 37.08, + "end": 37.1, + "confidence": 0.972 + }, + { + "text": "one", + "start": 37.1, + "end": 37.12, + "confidence": 0.972 + }, + { + "text": "who", + "start": 37.12, + "end": 37.14, + "confidence": 0.917 + }, + { + "text": "is", + "start": 37.14, + "end": 37.16, + "confidence": 0.978 + }, + { + "text": "the", + "start": 37.16, + "end": 37.18, + "confidence": 0.971 + } + ] + }, + { + "id": 2, + "seek": 3700, + "start": 37.18, + "end": 66.98, + "text": " one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who 
is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is the one who is", + "tokens": [ + 50363, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 
530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318, + 262, + 530, + 508, + 318 + ], + "temperature": 0.0, + "avg_logprob": -0.024528507656521266, + "compression_ratio": 26.93548387096774, + "no_speech_prob": 0.09981618076562881, + "confidence": 0.976, + "words": [ + { + "text": "one", + "start": 37.18, + "end": 37.32, + "confidence": 0.959 + }, + { + "text": "who", + "start": 37.32, + "end": 37.9, + "confidence": 0.954 + }, + { + "text": "is", + "start": 37.9, + "end": 37.92, + "confidence": 0.968 + }, + { + "text": "the", + "start": 37.92, + "end": 38.1, + "confidence": 0.962 + }, + { + "text": "one", + "start": 38.1, + "end": 38.6, + "confidence": 0.965 + }, + { + "text": "who", + "start": 38.6, + "end": 39.36, + "confidence": 0.979 + }, + { + "text": "is", + "start": 39.36, + "end": 39.58, + "confidence": 0.986 + }, + { + "text": "the", + "start": 39.58, + "end": 39.6, + "confidence": 0.969 + }, + { + "text": "one", + "start": 39.6, + "end": 39.62, + "confidence": 0.981 + }, + { + "text": "who", + "start": 39.62, + "end": 39.82, + "confidence": 0.985 + }, + { + "text": "is", + "start": 39.82, + "end": 40.12, + "confidence": 0.99 + }, + { + "text": "the", + "start": 40.12, + "end": 40.32, + "confidence": 0.957 + }, + { + "text": "one", + "start": 40.32, + "end": 40.62, + "confidence": 0.983 + }, + { + "text": "who", + "start": 40.62, + "end": 40.64, + "confidence": 0.984 + }, + { + "text": "is", + "start": 40.64, + "end": 40.66, + "confidence": 0.99 + }, + { + "text": "the", + "start": 40.66, + "end": 40.68, + "confidence": 0.956 + }, + { + "text": "one", + "start": 40.68, + "end": 40.74, + "confidence": 0.984 + }, + { + "text": "who", + "start": 40.74, + "end": 40.76, + "confidence": 0.984 + }, + { + "text": "is", + "start": 40.76, + "end": 40.78, + "confidence": 0.991 + }, + { + "text": "the", + "start": 40.78, + "end": 40.8, + "confidence": 0.953 + }, + { + "text": "one", + "start": 40.8, + "end": 40.82, + 
"confidence": 0.985 + }, + { + "text": "who", + "start": 40.82, + "end": 40.84, + "confidence": 0.979 + }, + { + "text": "is", + "start": 40.84, + "end": 40.86, + "confidence": 0.987 + }, + { + "text": "the", + "start": 40.86, + "end": 40.88, + "confidence": 0.495 + }, + { + "text": "one", + "start": 40.88, + "end": 41.5, + "confidence": 0.951 + }, + { + "text": "who", + "start": 41.5, + "end": 41.52, + "confidence": 0.968 + }, + { + "text": "is", + "start": 41.52, + "end": 41.54, + "confidence": 0.983 + }, + { + "text": "the", + "start": 41.54, + "end": 41.56, + "confidence": 0.844 + }, + { + "text": "one", + "start": 41.56, + "end": 41.58, + "confidence": 0.982 + }, + { + "text": "who", + "start": 41.58, + "end": 41.6, + "confidence": 0.973 + }, + { + "text": "is", + "start": 41.6, + "end": 41.62, + "confidence": 0.991 + }, + { + "text": "the", + "start": 41.62, + "end": 41.64, + "confidence": 0.888 + }, + { + "text": "one", + "start": 41.64, + "end": 41.66, + "confidence": 0.984 + }, + { + "text": "who", + "start": 41.66, + "end": 41.68, + "confidence": 0.978 + }, + { + "text": "is", + "start": 41.68, + "end": 41.7, + "confidence": 0.994 + }, + { + "text": "the", + "start": 41.7, + "end": 41.72, + "confidence": 0.915 + }, + { + "text": "one", + "start": 41.72, + "end": 41.74, + "confidence": 0.985 + }, + { + "text": "who", + "start": 41.74, + "end": 41.76, + "confidence": 0.981 + }, + { + "text": "is", + "start": 41.76, + "end": 41.78, + "confidence": 0.995 + }, + { + "text": "the", + "start": 41.78, + "end": 41.8, + "confidence": 0.937 + }, + { + "text": "one", + "start": 41.8, + "end": 41.82, + "confidence": 0.986 + }, + { + "text": "who", + "start": 41.82, + "end": 41.84, + "confidence": 0.983 + }, + { + "text": "is", + "start": 41.84, + "end": 41.86, + "confidence": 0.996 + }, + { + "text": "the", + "start": 41.86, + "end": 41.88, + "confidence": 0.95 + }, + { + "text": "one", + "start": 41.88, + "end": 41.9, + "confidence": 0.987 + }, + { + "text": "who", + 
"start": 41.9, + "end": 41.92, + "confidence": 0.983 + }, + { + "text": "is", + "start": 41.92, + "end": 41.94, + "confidence": 0.996 + }, + { + "text": "the", + "start": 41.94, + "end": 41.96, + "confidence": 0.961 + }, + { + "text": "one", + "start": 41.96, + "end": 41.98, + "confidence": 0.987 + }, + { + "text": "who", + "start": 41.98, + "end": 42.0, + "confidence": 0.984 + }, + { + "text": "is", + "start": 42.0, + "end": 42.02, + "confidence": 0.997 + }, + { + "text": "the", + "start": 42.02, + "end": 42.04, + "confidence": 0.969 + }, + { + "text": "one", + "start": 42.04, + "end": 42.06, + "confidence": 0.987 + }, + { + "text": "who", + "start": 42.06, + "end": 42.08, + "confidence": 0.983 + }, + { + "text": "is", + "start": 42.08, + "end": 42.1, + "confidence": 0.997 + }, + { + "text": "the", + "start": 42.1, + "end": 42.12, + "confidence": 0.975 + }, + { + "text": "one", + "start": 42.12, + "end": 42.14, + "confidence": 0.988 + }, + { + "text": "who", + "start": 42.14, + "end": 42.16, + "confidence": 0.983 + }, + { + "text": "is", + "start": 42.16, + "end": 42.18, + "confidence": 0.997 + }, + { + "text": "the", + "start": 42.18, + "end": 42.2, + "confidence": 0.979 + }, + { + "text": "one", + "start": 42.2, + "end": 42.22, + "confidence": 0.989 + }, + { + "text": "who", + "start": 42.22, + "end": 42.24, + "confidence": 0.983 + }, + { + "text": "is", + "start": 42.24, + "end": 42.26, + "confidence": 0.998 + }, + { + "text": "the", + "start": 42.26, + "end": 42.28, + "confidence": 0.982 + }, + { + "text": "one", + "start": 42.28, + "end": 42.3, + "confidence": 0.989 + }, + { + "text": "who", + "start": 42.3, + "end": 42.32, + "confidence": 0.982 + }, + { + "text": "is", + "start": 42.32, + "end": 42.34, + "confidence": 0.998 + }, + { + "text": "the", + "start": 42.34, + "end": 42.4, + "confidence": 0.983 + }, + { + "text": "one", + "start": 42.4, + "end": 42.56, + "confidence": 0.989 + }, + { + "text": "who", + "start": 42.56, + "end": 42.58, + "confidence": 
0.982 + }, + { + "text": "is", + "start": 42.58, + "end": 42.62, + "confidence": 0.998 + }, + { + "text": "the", + "start": 42.62, + "end": 42.64, + "confidence": 0.985 + }, + { + "text": "one", + "start": 42.64, + "end": 43.62, + "confidence": 0.989 + }, + { + "text": "who", + "start": 43.62, + "end": 43.64, + "confidence": 0.981 + }, + { + "text": "is", + "start": 43.64, + "end": 43.66, + "confidence": 0.998 + }, + { + "text": "the", + "start": 43.66, + "end": 43.68, + "confidence": 0.986 + }, + { + "text": "one", + "start": 43.68, + "end": 43.7, + "confidence": 0.989 + }, + { + "text": "who", + "start": 43.7, + "end": 43.72, + "confidence": 0.981 + }, + { + "text": "is", + "start": 43.72, + "end": 43.74, + "confidence": 0.998 + }, + { + "text": "the", + "start": 43.74, + "end": 43.76, + "confidence": 0.987 + }, + { + "text": "one", + "start": 43.76, + "end": 44.02, + "confidence": 0.989 + }, + { + "text": "who", + "start": 44.02, + "end": 44.04, + "confidence": 0.981 + }, + { + "text": "is", + "start": 44.04, + "end": 44.06, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.06, + "end": 44.08, + "confidence": 0.988 + }, + { + "text": "one", + "start": 44.08, + "end": 44.1, + "confidence": 0.989 + }, + { + "text": "who", + "start": 44.1, + "end": 44.12, + "confidence": 0.981 + }, + { + "text": "is", + "start": 44.12, + "end": 44.14, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.14, + "end": 44.16, + "confidence": 0.988 + }, + { + "text": "one", + "start": 44.16, + "end": 44.18, + "confidence": 0.989 + }, + { + "text": "who", + "start": 44.18, + "end": 44.2, + "confidence": 0.981 + }, + { + "text": "is", + "start": 44.2, + "end": 44.22, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.22, + "end": 44.24, + "confidence": 0.988 + }, + { + "text": "one", + "start": 44.24, + "end": 44.26, + "confidence": 0.989 + }, + { + "text": "who", + "start": 44.26, + "end": 44.28, + "confidence": 0.98 + }, + { + "text": "is", + "start": 
44.28, + "end": 44.3, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.3, + "end": 44.32, + "confidence": 0.988 + }, + { + "text": "one", + "start": 44.32, + "end": 44.34, + "confidence": 0.988 + }, + { + "text": "who", + "start": 44.34, + "end": 44.36, + "confidence": 0.98 + }, + { + "text": "is", + "start": 44.36, + "end": 44.38, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.38, + "end": 44.4, + "confidence": 0.988 + }, + { + "text": "one", + "start": 44.4, + "end": 44.42, + "confidence": 0.988 + }, + { + "text": "who", + "start": 44.42, + "end": 44.44, + "confidence": 0.98 + }, + { + "text": "is", + "start": 44.44, + "end": 44.46, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.46, + "end": 44.48, + "confidence": 0.988 + }, + { + "text": "one", + "start": 44.48, + "end": 44.54, + "confidence": 0.988 + }, + { + "text": "who", + "start": 44.54, + "end": 44.56, + "confidence": 0.98 + }, + { + "text": "is", + "start": 44.56, + "end": 44.58, + "confidence": 0.998 + }, + { + "text": "the", + "start": 44.58, + "end": 44.6, + "confidence": 0.988 + }, + { + "text": "one", + "start": 44.6, + "end": 45.16, + "confidence": 0.987 + }, + { + "text": "who", + "start": 45.16, + "end": 45.18, + "confidence": 0.98 + }, + { + "text": "is", + "start": 45.18, + "end": 45.2, + "confidence": 0.998 + }, + { + "text": "the", + "start": 45.2, + "end": 45.22, + "confidence": 0.988 + }, + { + "text": "one", + "start": 45.22, + "end": 45.24, + "confidence": 0.987 + }, + { + "text": "who", + "start": 45.24, + "end": 45.26, + "confidence": 0.979 + }, + { + "text": "is", + "start": 45.26, + "end": 45.28, + "confidence": 0.998 + }, + { + "text": "the", + "start": 45.28, + "end": 45.3, + "confidence": 0.988 + }, + { + "text": "one", + "start": 45.3, + "end": 45.32, + "confidence": 0.986 + }, + { + "text": "who", + "start": 45.32, + "end": 45.34, + "confidence": 0.978 + }, + { + "text": "is", + "start": 45.34, + "end": 45.36, + "confidence": 0.998 + }, + 
{ + "text": "the", + "start": 45.36, + "end": 45.38, + "confidence": 0.988 + }, + { + "text": "one", + "start": 45.38, + "end": 45.4, + "confidence": 0.986 + }, + { + "text": "who", + "start": 45.4, + "end": 45.42, + "confidence": 0.977 + }, + { + "text": "is", + "start": 45.42, + "end": 45.44, + "confidence": 0.998 + }, + { + "text": "the", + "start": 45.44, + "end": 45.46, + "confidence": 0.988 + }, + { + "text": "one", + "start": 45.46, + "end": 45.94, + "confidence": 0.985 + }, + { + "text": "who", + "start": 45.94, + "end": 45.96, + "confidence": 0.975 + }, + { + "text": "is", + "start": 45.96, + "end": 45.98, + "confidence": 0.997 + }, + { + "text": "the", + "start": 45.98, + "end": 46.0, + "confidence": 0.988 + }, + { + "text": "one", + "start": 46.0, + "end": 46.02, + "confidence": 0.985 + }, + { + "text": "who", + "start": 46.02, + "end": 46.04, + "confidence": 0.976 + }, + { + "text": "is", + "start": 46.04, + "end": 46.06, + "confidence": 0.997 + }, + { + "text": "the", + "start": 46.06, + "end": 46.08, + "confidence": 0.988 + }, + { + "text": "one", + "start": 46.08, + "end": 46.1, + "confidence": 0.984 + }, + { + "text": "who", + "start": 46.1, + "end": 46.12, + "confidence": 0.975 + }, + { + "text": "is", + "start": 46.12, + "end": 46.14, + "confidence": 0.997 + }, + { + "text": "the", + "start": 46.14, + "end": 46.16, + "confidence": 0.987 + }, + { + "text": "one", + "start": 46.16, + "end": 46.18, + "confidence": 0.984 + }, + { + "text": "who", + "start": 46.18, + "end": 46.2, + "confidence": 0.971 + }, + { + "text": "is", + "start": 46.2, + "end": 46.22, + "confidence": 0.997 + }, + { + "text": "the", + "start": 46.22, + "end": 46.24, + "confidence": 0.986 + }, + { + "text": "one", + "start": 46.24, + "end": 46.26, + "confidence": 0.983 + }, + { + "text": "who", + "start": 46.26, + "end": 46.28, + "confidence": 0.971 + }, + { + "text": "is", + "start": 46.28, + "end": 46.3, + "confidence": 0.996 + }, + { + "text": "the", + "start": 46.3, + "end": 
46.32, + "confidence": 0.986 + }, + { + "text": "one", + "start": 46.32, + "end": 46.84, + "confidence": 0.982 + }, + { + "text": "who", + "start": 46.84, + "end": 46.86, + "confidence": 0.969 + }, + { + "text": "is", + "start": 46.86, + "end": 46.88, + "confidence": 0.996 + }, + { + "text": "the", + "start": 46.88, + "end": 46.9, + "confidence": 0.986 + }, + { + "text": "one", + "start": 46.9, + "end": 46.92, + "confidence": 0.982 + }, + { + "text": "who", + "start": 46.92, + "end": 46.94, + "confidence": 0.966 + }, + { + "text": "is", + "start": 46.94, + "end": 46.96, + "confidence": 0.996 + }, + { + "text": "the", + "start": 46.96, + "end": 46.98, + "confidence": 0.985 + }, + { + "text": "one", + "start": 46.98, + "end": 47.1, + "confidence": 0.982 + }, + { + "text": "who", + "start": 47.1, + "end": 47.12, + "confidence": 0.966 + }, + { + "text": "is", + "start": 47.12, + "end": 47.14, + "confidence": 0.995 + }, + { + "text": "the", + "start": 47.14, + "end": 47.16, + "confidence": 0.985 + }, + { + "text": "one", + "start": 47.16, + "end": 47.18, + "confidence": 0.982 + }, + { + "text": "who", + "start": 47.18, + "end": 47.2, + "confidence": 0.963 + }, + { + "text": "is", + "start": 47.2, + "end": 47.22, + "confidence": 0.995 + }, + { + "text": "the", + "start": 47.22, + "end": 47.24, + "confidence": 0.984 + }, + { + "text": "one", + "start": 47.24, + "end": 47.26, + "confidence": 0.98 + }, + { + "text": "who", + "start": 47.26, + "end": 47.28, + "confidence": 0.959 + }, + { + "text": "is", + "start": 47.28, + "end": 47.3, + "confidence": 0.994 + }, + { + "text": "the", + "start": 47.3, + "end": 47.32, + "confidence": 0.983 + }, + { + "text": "one", + "start": 47.32, + "end": 47.34, + "confidence": 0.98 + }, + { + "text": "who", + "start": 47.34, + "end": 47.36, + "confidence": 0.958 + }, + { + "text": "is", + "start": 47.36, + "end": 47.38, + "confidence": 0.994 + }, + { + "text": "the", + "start": 47.38, + "end": 47.4, + "confidence": 0.983 + }, + { + "text": 
"one", + "start": 47.4, + "end": 47.6, + "confidence": 0.979 + }, + { + "text": "who", + "start": 47.6, + "end": 47.62, + "confidence": 0.955 + }, + { + "text": "is", + "start": 47.62, + "end": 47.64, + "confidence": 0.993 + }, + { + "text": "the", + "start": 47.64, + "end": 47.66, + "confidence": 0.982 + }, + { + "text": "one", + "start": 47.66, + "end": 47.68, + "confidence": 0.98 + }, + { + "text": "who", + "start": 47.68, + "end": 47.7, + "confidence": 0.956 + }, + { + "text": "is", + "start": 47.7, + "end": 47.72, + "confidence": 0.993 + }, + { + "text": "the", + "start": 47.72, + "end": 47.74, + "confidence": 0.981 + }, + { + "text": "one", + "start": 47.74, + "end": 47.76, + "confidence": 0.978 + }, + { + "text": "who", + "start": 47.76, + "end": 47.78, + "confidence": 0.949 + }, + { + "text": "is", + "start": 47.78, + "end": 47.8, + "confidence": 0.992 + }, + { + "text": "the", + "start": 47.8, + "end": 47.82, + "confidence": 0.98 + }, + { + "text": "one", + "start": 47.82, + "end": 49.1, + "confidence": 0.978 + }, + { + "text": "who", + "start": 49.1, + "end": 49.12, + "confidence": 0.948 + }, + { + "text": "is", + "start": 49.12, + "end": 49.14, + "confidence": 0.991 + }, + { + "text": "the", + "start": 49.14, + "end": 49.16, + "confidence": 0.98 + }, + { + "text": "one", + "start": 49.16, + "end": 49.26, + "confidence": 0.978 + }, + { + "text": "who", + "start": 49.26, + "end": 49.28, + "confidence": 0.949 + }, + { + "text": "is", + "start": 49.28, + "end": 49.3, + "confidence": 0.991 + }, + { + "text": "the", + "start": 49.3, + "end": 49.32, + "confidence": 0.979 + }, + { + "text": "one", + "start": 49.32, + "end": 49.34, + "confidence": 0.977 + }, + { + "text": "who", + "start": 49.34, + "end": 49.36, + "confidence": 0.944 + }, + { + "text": "is", + "start": 49.36, + "end": 49.38, + "confidence": 0.99 + }, + { + "text": "the", + "start": 49.38, + "end": 49.4, + "confidence": 0.977 + }, + { + "text": "one", + "start": 49.4, + "end": 49.42, + 
"confidence": 0.976 + }, + { + "text": "who", + "start": 49.42, + "end": 49.44, + "confidence": 0.94 + }, + { + "text": "is", + "start": 49.44, + "end": 49.46, + "confidence": 0.989 + }, + { + "text": "the", + "start": 49.46, + "end": 49.48, + "confidence": 0.977 + }, + { + "text": "one", + "start": 49.48, + "end": 49.5, + "confidence": 0.975 + }, + { + "text": "who", + "start": 49.5, + "end": 49.52, + "confidence": 0.94 + }, + { + "text": "is", + "start": 49.52, + "end": 49.54, + "confidence": 0.989 + }, + { + "text": "the", + "start": 49.54, + "end": 49.56, + "confidence": 0.975 + }, + { + "text": "one", + "start": 49.56, + "end": 49.58, + "confidence": 0.975 + }, + { + "text": "who", + "start": 49.58, + "end": 49.6, + "confidence": 0.935 + }, + { + "text": "is", + "start": 49.6, + "end": 49.62, + "confidence": 0.987 + }, + { + "text": "the", + "start": 49.62, + "end": 49.64, + "confidence": 0.974 + }, + { + "text": "one", + "start": 49.64, + "end": 49.66, + "confidence": 0.975 + }, + { + "text": "who", + "start": 49.66, + "end": 49.68, + "confidence": 0.936 + }, + { + "text": "is", + "start": 49.68, + "end": 49.7, + "confidence": 0.988 + }, + { + "text": "the", + "start": 49.7, + "end": 49.72, + "confidence": 0.974 + }, + { + "text": "one", + "start": 49.72, + "end": 49.74, + "confidence": 0.971 + }, + { + "text": "who", + "start": 49.74, + "end": 49.76, + "confidence": 0.932 + }, + { + "text": "is", + "start": 49.76, + "end": 49.78, + "confidence": 0.986 + }, + { + "text": "the", + "start": 49.78, + "end": 49.8, + "confidence": 0.971 + }, + { + "text": "one", + "start": 49.8, + "end": 49.82, + "confidence": 0.971 + }, + { + "text": "who", + "start": 49.82, + "end": 49.84, + "confidence": 0.928 + }, + { + "text": "is", + "start": 49.84, + "end": 49.86, + "confidence": 0.986 + }, + { + "text": "the", + "start": 49.86, + "end": 49.88, + "confidence": 0.971 + }, + { + "text": "one", + "start": 49.88, + "end": 49.9, + "confidence": 0.971 + }, + { + "text": "who", + 
"start": 49.9, + "end": 49.92, + "confidence": 0.923 + }, + { + "text": "is", + "start": 49.92, + "end": 49.94, + "confidence": 0.985 + }, + { + "text": "the", + "start": 49.94, + "end": 49.96, + "confidence": 0.97 + }, + { + "text": "one", + "start": 49.96, + "end": 66.64, + "confidence": 0.969 + }, + { + "text": "who", + "start": 66.64, + "end": 66.66, + "confidence": 0.925 + }, + { + "text": "is", + "start": 66.66, + "end": 66.98, + "confidence": 0.985 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/split_subtitles/punctuations.mp3_20.srt b/tests/expected/split_subtitles/punctuations.mp3_20.srt new file mode 100644 index 0000000000000000000000000000000000000000..607f0125cf1df1d150f8432a5ce5ad72669143df --- /dev/null +++ b/tests/expected/split_subtitles/punctuations.mp3_20.srt @@ -0,0 +1,12 @@ +1 +00:00:00,400 --> 00:00:01,360 +Dis-moi, + +2 +00:00:01,360 --> 00:00:02,020 +est-ce que l'avion + +3 +00:00:02,020 --> 00:00:02,340 +vole? + diff --git a/tests/expected/split_subtitles/punctuations.mp3_20.vtt b/tests/expected/split_subtitles/punctuations.mp3_20.vtt new file mode 100644 index 0000000000000000000000000000000000000000..d06e85098725e851017bd86f94fa529b5c66d030 --- /dev/null +++ b/tests/expected/split_subtitles/punctuations.mp3_20.vtt @@ -0,0 +1,11 @@ +WEBVTT + +00:00.400 --> 00:01.360 +Dis-moi, + +00:01.360 --> 00:02.020 +est-ce que l'avion + +00:02.020 --> 00:02.340 +vole? + diff --git a/tests/expected/split_subtitles/punctuations.mp3_50.srt b/tests/expected/split_subtitles/punctuations.mp3_50.srt new file mode 100644 index 0000000000000000000000000000000000000000..ffc9a2b42b2c510691ec27b303df2c88825c0aa4 --- /dev/null +++ b/tests/expected/split_subtitles/punctuations.mp3_50.srt @@ -0,0 +1,4 @@ +1 +00:00:00,400 --> 00:00:02,340 +Dis-moi, est-ce que l'avion vole? 
+ diff --git a/tests/expected/split_subtitles/punctuations.mp3_50.vtt b/tests/expected/split_subtitles/punctuations.mp3_50.vtt new file mode 100644 index 0000000000000000000000000000000000000000..83c7bd9a0253ca6a8d117803fac3a2bdc3b9e525 --- /dev/null +++ b/tests/expected/split_subtitles/punctuations.mp3_50.vtt @@ -0,0 +1,5 @@ +WEBVTT + +00:00.400 --> 00:02.340 +Dis-moi, est-ce que l'avion vole? + diff --git a/tests/expected/split_subtitles/punctuations.mp3_6.srt b/tests/expected/split_subtitles/punctuations.mp3_6.srt new file mode 100644 index 0000000000000000000000000000000000000000..0caea3d7e82a647c78c154e2d1879292e5442c9d --- /dev/null +++ b/tests/expected/split_subtitles/punctuations.mp3_6.srt @@ -0,0 +1,20 @@ +1 +00:00:00,400 --> 00:00:01,360 +Dis-moi, + +2 +00:00:01,360 --> 00:00:01,520 +est-ce + +3 +00:00:01,520 --> 00:00:01,640 +que + +4 +00:00:01,640 --> 00:00:02,020 +l'avion + +5 +00:00:02,020 --> 00:00:02,340 +vole? + diff --git a/tests/expected/split_subtitles/punctuations.mp3_6.vtt b/tests/expected/split_subtitles/punctuations.mp3_6.vtt new file mode 100644 index 0000000000000000000000000000000000000000..f255e42075a222812432fc82fe6622c86de71015 --- /dev/null +++ b/tests/expected/split_subtitles/punctuations.mp3_6.vtt @@ -0,0 +1,17 @@ +WEBVTT + +00:00.400 --> 00:01.360 +Dis-moi, + +00:01.360 --> 00:01.520 +est-ce + +00:01.520 --> 00:01.640 +que + +00:01.640 --> 00:02.020 +l'avion + +00:02.020 --> 00:02.340 +vole? 
+ diff --git a/tests/expected/split_subtitles/smartphone.mp3_20.srt b/tests/expected/split_subtitles/smartphone.mp3_20.srt new file mode 100644 index 0000000000000000000000000000000000000000..22c039440f6cb0beda8f9ccf043d766a717ac78a --- /dev/null +++ b/tests/expected/split_subtitles/smartphone.mp3_20.srt @@ -0,0 +1,812 @@ +1 +00:00:00,380 --> 00:00:01,080 +C'est évident ce que + +2 +00:00:01,080 --> 00:00:01,780 +dit Nicolas, + +3 +00:00:01,780 --> 00:00:02,380 +mais je ne me + +4 +00:00:02,380 --> 00:00:02,840 +l'étais jamais + +5 +00:00:02,840 --> 00:00:03,620 +formulé comme ça. + +6 +00:00:04,080 --> 00:00:05,000 +Ce qui fait la force + +7 +00:00:05,000 --> 00:00:05,880 +du smartphone, + +8 +00:00:05,880 --> 00:00:06,520 +c'est pas seulement + +9 +00:00:06,520 --> 00:00:07,560 +l'accumulation des + +10 +00:00:07,560 --> 00:00:07,920 +fonctions, + +11 +00:00:08,320 --> 00:00:09,100 +mais la manière dont + +12 +00:00:09,100 --> 00:00:10,320 +elles interagissent + +13 +00:00:10,320 --> 00:00:10,880 +entre elles. + +14 +00:00:10,960 --> 00:00:11,400 +Ce qui dit + +15 +00:00:11,400 --> 00:00:11,780 +d'ailleurs sur la + +16 +00:00:11,780 --> 00:00:12,120 +photo, + +17 +00:00:12,120 --> 00:00:13,000 +c'est hyper convaincant. + +18 +00:00:13,340 --> 00:00:14,340 +Alors évidemment, + +19 +00:00:14,340 --> 00:00:15,160 +il faudrait ajouter + +20 +00:00:15,160 --> 00:00:16,020 +les interfaces. + +21 +00:00:16,220 --> 00:00:17,260 +L'écran tactile a + +22 +00:00:17,260 --> 00:00:18,620 +été beaucoup très + +23 +00:00:18,620 --> 00:00:19,360 +souvent mentionné. + +24 +00:00:19,840 --> 00:00:20,520 +Mais bon, + +25 +00:00:20,520 --> 00:00:20,960 +il faut dire qu'il + +26 +00:00:20,960 --> 00:00:22,100 +profite aussi de 20 + +27 +00:00:22,100 --> 00:00:22,920 +ans pendant lesquels + +28 +00:00:22,920 --> 00:00:23,720 +les ordinateurs nous + +29 +00:00:23,720 --> 00:00:24,500 +ont appris à cliquer + +30 +00:00:24,500 --> 00:00:25,260 +sur des icônes. 
+ +31 +00:00:25,420 --> 00:00:26,660 +Sauf que le + +32 +00:00:26,660 --> 00:00:27,620 +smartphone ajoute le + +33 +00:00:27,620 --> 00:00:28,180 +toucher, + +34 +00:00:28,180 --> 00:00:28,680 +ce qui rend le + +35 +00:00:28,680 --> 00:00:30,220 +contact plus direct, + +36 +00:00:30,220 --> 00:00:30,640 +plus sensible. + +37 +00:00:31,040 --> 00:00:31,700 +Et puis évidemment, + +38 +00:00:31,700 --> 00:00:32,120 +il faudrait parler + +39 +00:00:32,120 --> 00:00:32,480 +aussi des + +40 +00:00:32,480 --> 00:00:33,180 +applications qui + +41 +00:00:33,180 --> 00:00:33,960 +permettent de + +42 +00:00:33,960 --> 00:00:34,800 +contourner le côté + +43 +00:00:34,800 --> 00:00:35,780 +touffu de la + +44 +00:00:35,780 --> 00:00:36,780 +navigation web pour + +45 +00:00:36,780 --> 00:00:37,680 +aller directement au + +46 +00:00:37,680 --> 00:00:37,820 +but. + +47 +00:00:37,820 --> 00:00:39,420 +Bref, tout ça, + +48 +00:00:39,420 --> 00:00:40,160 +ce sont les + +49 +00:00:40,160 --> 00:00:40,960 +conditions qui + +50 +00:00:40,960 --> 00:00:42,060 +permettent de créer + +51 +00:00:42,060 --> 00:00:42,800 +cet objet dont + +52 +00:00:42,800 --> 00:00:43,700 +Nicolas dit qu'il + +53 +00:00:43,700 --> 00:00:43,880 +est + +54 +00:00:43,880 --> 00:00:44,980 +vraisemblablement + +55 +00:00:44,980 --> 00:00:45,700 +inédit dans + +56 +00:00:45,700 --> 00:00:46,180 +l'histoire de + +57 +00:00:46,180 --> 00:00:46,580 +l'humanité. + +58 +00:00:46,600 --> 00:00:47,720 +Mais ça, + +59 +00:00:47,720 --> 00:00:48,260 +ça soulève une autre + +60 +00:00:48,260 --> 00:00:48,820 +interrogation. + +61 +00:00:49,220 --> 00:00:49,980 +Est-ce que le fait + +62 +00:00:49,980 --> 00:00:51,120 +que cet objet soit + +63 +00:00:51,120 --> 00:00:52,420 +inédit induit que + +64 +00:00:52,420 --> 00:00:53,660 +notre rapport à lui + +65 +00:00:53,660 --> 00:00:55,000 +est aussi un rapport + +66 +00:00:55,000 --> 00:00:55,460 +inédit? 
+ +67 +00:00:55,460 --> 00:00:56,240 +Je veux dire, + +68 +00:00:56,240 --> 00:00:56,580 +est-ce que le + +69 +00:00:56,580 --> 00:00:57,280 +rapport qu'on a au + +70 +00:00:57,280 --> 00:00:57,920 +smartphone est + +71 +00:00:57,920 --> 00:00:58,660 +comparable à celui + +72 +00:00:58,660 --> 00:00:59,460 +qu'on entretenait à + +73 +00:00:59,460 --> 00:00:59,960 +d'autres objets + +74 +00:00:59,960 --> 00:01:01,500 +techniques comme la + +75 +00:01:01,500 --> 00:01:02,680 +voiture ou le + +76 +00:01:02,680 --> 00:01:03,120 +téléphone? + +77 +00:01:03,360 --> 00:01:05,660 +Il n'y a pas + +78 +00:01:05,660 --> 00:01:06,420 +d'équivalent en + +79 +00:01:06,420 --> 00:01:06,660 +fait. + +80 +00:01:06,880 --> 00:01:07,540 +Et donc cette espèce + +81 +00:01:07,540 --> 00:01:08,940 +de nouveauté dans la + +82 +00:01:08,940 --> 00:01:10,240 +relation à l'objet, + +83 +00:01:10,240 --> 00:01:10,760 +c'est fascinant et + +84 +00:01:10,760 --> 00:01:11,520 +terrifiant. + +85 +00:01:11,620 --> 00:01:12,440 +Parce qu'on a + +86 +00:01:12,440 --> 00:01:13,560 +l'impression, + +87 +00:01:13,560 --> 00:01:14,400 +comme le disent les + +88 +00:01:14,400 --> 00:01:15,000 +utilisateurs et les + +89 +00:01:15,000 --> 00:01:15,220 +services, + +90 +00:01:15,220 --> 00:01:16,080 +d'être dépendants de + +91 +00:01:16,080 --> 00:01:16,480 +cet objet, + +92 +00:01:16,860 --> 00:01:17,340 +d'induire en fait + +93 +00:01:17,340 --> 00:01:18,480 +une espèce de + +94 +00:01:18,480 --> 00:01:18,600 +relation, + +95 +00:01:18,600 --> 00:01:19,920 +de médiation avec le + +96 +00:01:19,920 --> 00:01:21,780 +monde qui rend de + +97 +00:01:21,780 --> 00:01:22,240 +l'ampleur et qui + +98 +00:01:22,240 --> 00:01:22,720 +amène aussi à des + +99 +00:01:22,720 --> 00:01:23,260 +formes de rejet. + +100 +00:01:23,940 --> 00:01:24,940 +Donc, + +101 +00:01:24,940 --> 00:01:26,560 +à objet inédit, + +102 +00:01:26,560 --> 00:01:27,800 +rapport inédit. 
+ +103 +00:01:28,020 --> 00:01:29,280 +Et ce rapport, + +104 +00:01:29,280 --> 00:01:29,880 +si j'en crois + +105 +00:01:29,880 --> 00:01:30,540 +Nicolas, + +106 +00:01:30,540 --> 00:01:31,800 +serait caractérisé + +107 +00:01:31,800 --> 00:01:33,400 +par un mélange de + +108 +00:01:33,400 --> 00:01:34,680 +dépendance et de + +109 +00:01:34,680 --> 00:01:35,140 +rejet. + +110 +00:01:35,780 --> 00:01:37,140 +Bon, en vrai, + +111 +00:01:37,140 --> 00:01:38,080 +il faudrait remonter + +112 +00:01:38,080 --> 00:01:39,320 +très très finement + +113 +00:01:39,320 --> 00:01:40,240 +toute l'histoire des + +114 +00:01:40,240 --> 00:01:41,480 +objets techniques et + +115 +00:01:41,480 --> 00:01:42,320 +de leur insertion + +116 +00:01:42,320 --> 00:01:42,860 +dans nos vies + +117 +00:01:42,900 --> 00:01:43,760 +pour déterminer si + +118 +00:01:43,760 --> 00:01:44,740 +ce rapport est + +119 +00:01:44,740 --> 00:01:45,740 +totalement inédit. + +120 +00:01:46,100 --> 00:01:46,920 +Mais j'ai + +121 +00:01:46,920 --> 00:01:47,560 +l'impression comme + +122 +00:01:47,560 --> 00:01:48,700 +ça que Nicolas ne se + +123 +00:01:48,700 --> 00:01:49,340 +trompe pas vraiment. + +124 +00:01:49,880 --> 00:01:50,520 +Pour autant que je + +125 +00:01:50,520 --> 00:01:51,140 +sache, + +126 +00:01:51,140 --> 00:01:52,060 +il y a eu plein de + +127 +00:01:52,060 --> 00:01:52,940 +discussions autour + +128 +00:01:52,940 --> 00:01:54,060 +de la voiture ou + +129 +00:01:54,060 --> 00:01:54,980 +même du téléphone. + +130 +00:01:55,340 --> 00:01:56,400 +Mais la dépendance + +131 +00:01:56,400 --> 00:01:57,460 +n'était pas du même + +132 +00:01:57,460 --> 00:01:57,780 +ordre. + +133 +00:01:57,780 --> 00:01:58,780 +Donc le rejet non + +134 +00:01:58,780 --> 00:01:59,380 +plus n'était pas du + +135 +00:01:59,380 --> 00:01:59,840 +même ordre. 
+ +136 +00:01:59,980 --> 00:02:00,880 +On peut adorer sa + +137 +00:02:00,880 --> 00:02:01,460 +bagnole, + +138 +00:02:01,460 --> 00:02:02,340 +en avoir besoin pour + +139 +00:02:02,340 --> 00:02:03,020 +plein de choses. + +140 +00:02:03,280 --> 00:02:04,680 +Et bien, le soir, + +141 +00:02:04,680 --> 00:02:05,380 +quand on va se + +142 +00:02:05,380 --> 00:02:05,800 +coucher, + +143 +00:02:05,800 --> 00:02:06,360 +on la laisse. + +144 +00:02:06,980 --> 00:02:07,800 +On ne l'a pas dans + +145 +00:02:07,800 --> 00:02:08,680 +la main quand on est + +146 +00:02:08,680 --> 00:02:09,140 +au lit, + +147 +00:02:09,140 --> 00:02:09,680 +on ne l'emmène pas + +148 +00:02:09,680 --> 00:02:10,480 +au chiottes. + +149 +00:02:10,860 --> 00:02:11,480 +On pouvait être + +150 +00:02:11,480 --> 00:02:13,100 +énervé par son môme + +151 +00:02:13,100 --> 00:02:13,800 +qui occupait la + +152 +00:02:13,800 --> 00:02:14,600 +ligne de téléphone + +153 +00:02:14,600 --> 00:02:15,360 +pendant une heure + +154 +00:02:15,360 --> 00:02:15,960 +chaque soir pour + +155 +00:02:15,960 --> 00:02:16,600 +discuter avec un + +156 +00:02:16,600 --> 00:02:16,900 +copain. + +157 +00:02:17,280 --> 00:02:17,940 +Mais ça ne + +158 +00:02:17,940 --> 00:02:18,980 +ressemblait pas à ce + +159 +00:02:18,980 --> 00:02:20,120 +qu'on peut ressentir + +160 +00:02:20,120 --> 00:02:21,340 +à voir ce même môme + +161 +00:02:21,340 --> 00:02:21,880 +aujourd'hui, + +162 +00:02:22,140 --> 00:02:23,180 +continuellement avec + +163 +00:02:23,180 --> 00:02:23,940 +son smartphone dans + +164 +00:02:23,940 --> 00:02:24,360 +la main, + +165 +00:02:24,360 --> 00:02:25,060 +comme si c'était une + +166 +00:02:25,060 --> 00:02:25,820 +sorte de pacemaker + +167 +00:02:25,820 --> 00:02:26,300 +externe, + +168 +00:02:26,340 --> 00:02:27,360 +comme si le lâcher + +169 +00:02:27,360 --> 00:02:28,000 +allait entraîner sa + +170 +00:02:28,000 --> 00:02:28,840 +mort immédiate. 
+ +171 +00:02:29,040 --> 00:02:29,280 +Bon, + +172 +00:02:29,280 --> 00:02:29,880 +je dis ça pour le + +173 +00:02:29,880 --> 00:02:30,320 +môme, + +174 +00:02:30,320 --> 00:02:31,140 +mais c'est évidemment + +175 +00:02:31,140 --> 00:02:31,760 +valable pour nous + +176 +00:02:31,760 --> 00:02:31,960 +aussi. + +177 +00:02:32,340 --> 00:02:33,460 +Donc, + +178 +00:02:33,460 --> 00:02:34,240 +rapport inédit. + +179 +00:02:34,240 --> 00:02:35,480 +D'accord. + +180 +00:02:35,480 --> 00:02:36,680 +Mais pourquoi a-t-on + +181 +00:02:36,680 --> 00:02:37,260 +l'impression qu'on + +182 +00:02:37,260 --> 00:02:38,220 +n'en sortira jamais? + +183 +00:02:38,860 --> 00:02:39,780 +Est-ce qu'il faut en + +184 +00:02:39,780 --> 00:02:40,660 +remettre la faute + +185 +00:02:40,660 --> 00:02:41,720 +sur les gens qui ont + +186 +00:02:41,720 --> 00:02:42,780 +créé cet outil + +187 +00:02:42,780 --> 00:02:43,500 +merveilleux et + +188 +00:02:43,500 --> 00:02:43,860 +diabolique, + +189 +00:02:43,860 --> 00:02:44,660 +et diabolique parce + +190 +00:02:44,660 --> 00:02:45,320 +que merveilleux? + +191 +00:02:46,340 --> 00:02:47,480 +Les économistes + +192 +00:02:47,480 --> 00:02:47,820 +parlent de + +193 +00:02:47,820 --> 00:02:48,500 +dépendance du + +194 +00:02:48,500 --> 00:02:48,820 +sentier. + +195 +00:02:48,860 --> 00:02:49,700 +C'est l'idée qu'on + +196 +00:02:49,700 --> 00:02:50,780 +est sur un sentier + +197 +00:02:50,780 --> 00:02:51,900 +qui a été établi, + +198 +00:02:51,900 --> 00:02:52,720 +soit volontairement + +199 +00:02:52,720 --> 00:02:54,240 +en marchant dessus, + +200 +00:02:54,240 --> 00:02:55,500 +soit en définissant + +201 +00:02:55,500 --> 00:02:56,040 +des bornes, + +202 +00:02:56,040 --> 00:02:56,820 +en définissant une + +203 +00:02:56,820 --> 00:02:57,420 +signalétique. 
+ diff --git a/tests/expected/split_subtitles/smartphone.mp3_20.vtt b/tests/expected/split_subtitles/smartphone.mp3_20.vtt new file mode 100644 index 0000000000000000000000000000000000000000..b880a5ca949532022a422bc316c7efd245866555 --- /dev/null +++ b/tests/expected/split_subtitles/smartphone.mp3_20.vtt @@ -0,0 +1,611 @@ +WEBVTT + +00:00.380 --> 00:01.080 +C'est évident ce que + +00:01.080 --> 00:01.780 +dit Nicolas, + +00:01.780 --> 00:02.380 +mais je ne me + +00:02.380 --> 00:02.840 +l'étais jamais + +00:02.840 --> 00:03.620 +formulé comme ça. + +00:04.080 --> 00:05.000 +Ce qui fait la force + +00:05.000 --> 00:05.880 +du smartphone, + +00:05.880 --> 00:06.520 +c'est pas seulement + +00:06.520 --> 00:07.560 +l'accumulation des + +00:07.560 --> 00:07.920 +fonctions, + +00:08.320 --> 00:09.100 +mais la manière dont + +00:09.100 --> 00:10.320 +elles interagissent + +00:10.320 --> 00:10.880 +entre elles. + +00:10.960 --> 00:11.400 +Ce qui dit + +00:11.400 --> 00:11.780 +d'ailleurs sur la + +00:11.780 --> 00:12.120 +photo, + +00:12.120 --> 00:13.000 +c'est hyper convaincant. + +00:13.340 --> 00:14.340 +Alors évidemment, + +00:14.340 --> 00:15.160 +il faudrait ajouter + +00:15.160 --> 00:16.020 +les interfaces. + +00:16.220 --> 00:17.260 +L'écran tactile a + +00:17.260 --> 00:18.620 +été beaucoup très + +00:18.620 --> 00:19.360 +souvent mentionné. + +00:19.840 --> 00:20.520 +Mais bon, + +00:20.520 --> 00:20.960 +il faut dire qu'il + +00:20.960 --> 00:22.100 +profite aussi de 20 + +00:22.100 --> 00:22.920 +ans pendant lesquels + +00:22.920 --> 00:23.720 +les ordinateurs nous + +00:23.720 --> 00:24.500 +ont appris à cliquer + +00:24.500 --> 00:25.260 +sur des icônes. + +00:25.420 --> 00:26.660 +Sauf que le + +00:26.660 --> 00:27.620 +smartphone ajoute le + +00:27.620 --> 00:28.180 +toucher, + +00:28.180 --> 00:28.680 +ce qui rend le + +00:28.680 --> 00:30.220 +contact plus direct, + +00:30.220 --> 00:30.640 +plus sensible. 
+ +00:31.040 --> 00:31.700 +Et puis évidemment, + +00:31.700 --> 00:32.120 +il faudrait parler + +00:32.120 --> 00:32.480 +aussi des + +00:32.480 --> 00:33.180 +applications qui + +00:33.180 --> 00:33.960 +permettent de + +00:33.960 --> 00:34.800 +contourner le côté + +00:34.800 --> 00:35.780 +touffu de la + +00:35.780 --> 00:36.780 +navigation web pour + +00:36.780 --> 00:37.680 +aller directement au + +00:37.680 --> 00:37.820 +but. + +00:37.820 --> 00:39.420 +Bref, tout ça, + +00:39.420 --> 00:40.160 +ce sont les + +00:40.160 --> 00:40.960 +conditions qui + +00:40.960 --> 00:42.060 +permettent de créer + +00:42.060 --> 00:42.800 +cet objet dont + +00:42.800 --> 00:43.700 +Nicolas dit qu'il + +00:43.700 --> 00:43.880 +est + +00:43.880 --> 00:44.980 +vraisemblablement + +00:44.980 --> 00:45.700 +inédit dans + +00:45.700 --> 00:46.180 +l'histoire de + +00:46.180 --> 00:46.580 +l'humanité. + +00:46.600 --> 00:47.720 +Mais ça, + +00:47.720 --> 00:48.260 +ça soulève une autre + +00:48.260 --> 00:48.820 +interrogation. + +00:49.220 --> 00:49.980 +Est-ce que le fait + +00:49.980 --> 00:51.120 +que cet objet soit + +00:51.120 --> 00:52.420 +inédit induit que + +00:52.420 --> 00:53.660 +notre rapport à lui + +00:53.660 --> 00:55.000 +est aussi un rapport + +00:55.000 --> 00:55.460 +inédit? + +00:55.460 --> 00:56.240 +Je veux dire, + +00:56.240 --> 00:56.580 +est-ce que le + +00:56.580 --> 00:57.280 +rapport qu'on a au + +00:57.280 --> 00:57.920 +smartphone est + +00:57.920 --> 00:58.660 +comparable à celui + +00:58.660 --> 00:59.460 +qu'on entretenait à + +00:59.460 --> 00:59.960 +d'autres objets + +00:59.960 --> 01:01.500 +techniques comme la + +01:01.500 --> 01:02.680 +voiture ou le + +01:02.680 --> 01:03.120 +téléphone? + +01:03.360 --> 01:05.660 +Il n'y a pas + +01:05.660 --> 01:06.420 +d'équivalent en + +01:06.420 --> 01:06.660 +fait. 
+ +01:06.880 --> 01:07.540 +Et donc cette espèce + +01:07.540 --> 01:08.940 +de nouveauté dans la + +01:08.940 --> 01:10.240 +relation à l'objet, + +01:10.240 --> 01:10.760 +c'est fascinant et + +01:10.760 --> 01:11.520 +terrifiant. + +01:11.620 --> 01:12.440 +Parce qu'on a + +01:12.440 --> 01:13.560 +l'impression, + +01:13.560 --> 01:14.400 +comme le disent les + +01:14.400 --> 01:15.000 +utilisateurs et les + +01:15.000 --> 01:15.220 +services, + +01:15.220 --> 01:16.080 +d'être dépendants de + +01:16.080 --> 01:16.480 +cet objet, + +01:16.860 --> 01:17.340 +d'induire en fait + +01:17.340 --> 01:18.480 +une espèce de + +01:18.480 --> 01:18.600 +relation, + +01:18.600 --> 01:19.920 +de médiation avec le + +01:19.920 --> 01:21.780 +monde qui rend de + +01:21.780 --> 01:22.240 +l'ampleur et qui + +01:22.240 --> 01:22.720 +amène aussi à des + +01:22.720 --> 01:23.260 +formes de rejet. + +01:23.940 --> 01:24.940 +Donc, + +01:24.940 --> 01:26.560 +à objet inédit, + +01:26.560 --> 01:27.800 +rapport inédit. + +01:28.020 --> 01:29.280 +Et ce rapport, + +01:29.280 --> 01:29.880 +si j'en crois + +01:29.880 --> 01:30.540 +Nicolas, + +01:30.540 --> 01:31.800 +serait caractérisé + +01:31.800 --> 01:33.400 +par un mélange de + +01:33.400 --> 01:34.680 +dépendance et de + +01:34.680 --> 01:35.140 +rejet. + +01:35.780 --> 01:37.140 +Bon, en vrai, + +01:37.140 --> 01:38.080 +il faudrait remonter + +01:38.080 --> 01:39.320 +très très finement + +01:39.320 --> 01:40.240 +toute l'histoire des + +01:40.240 --> 01:41.480 +objets techniques et + +01:41.480 --> 01:42.320 +de leur insertion + +01:42.320 --> 01:42.860 +dans nos vies + +01:42.900 --> 01:43.760 +pour déterminer si + +01:43.760 --> 01:44.740 +ce rapport est + +01:44.740 --> 01:45.740 +totalement inédit. + +01:46.100 --> 01:46.920 +Mais j'ai + +01:46.920 --> 01:47.560 +l'impression comme + +01:47.560 --> 01:48.700 +ça que Nicolas ne se + +01:48.700 --> 01:49.340 +trompe pas vraiment. 
+ +01:49.880 --> 01:50.520 +Pour autant que je + +01:50.520 --> 01:51.140 +sache, + +01:51.140 --> 01:52.060 +il y a eu plein de + +01:52.060 --> 01:52.940 +discussions autour + +01:52.940 --> 01:54.060 +de la voiture ou + +01:54.060 --> 01:54.980 +même du téléphone. + +01:55.340 --> 01:56.400 +Mais la dépendance + +01:56.400 --> 01:57.460 +n'était pas du même + +01:57.460 --> 01:57.780 +ordre. + +01:57.780 --> 01:58.780 +Donc le rejet non + +01:58.780 --> 01:59.380 +plus n'était pas du + +01:59.380 --> 01:59.840 +même ordre. + +01:59.980 --> 02:00.880 +On peut adorer sa + +02:00.880 --> 02:01.460 +bagnole, + +02:01.460 --> 02:02.340 +en avoir besoin pour + +02:02.340 --> 02:03.020 +plein de choses. + +02:03.280 --> 02:04.680 +Et bien, le soir, + +02:04.680 --> 02:05.380 +quand on va se + +02:05.380 --> 02:05.800 +coucher, + +02:05.800 --> 02:06.360 +on la laisse. + +02:06.980 --> 02:07.800 +On ne l'a pas dans + +02:07.800 --> 02:08.680 +la main quand on est + +02:08.680 --> 02:09.140 +au lit, + +02:09.140 --> 02:09.680 +on ne l'emmène pas + +02:09.680 --> 02:10.480 +au chiottes. + +02:10.860 --> 02:11.480 +On pouvait être + +02:11.480 --> 02:13.100 +énervé par son môme + +02:13.100 --> 02:13.800 +qui occupait la + +02:13.800 --> 02:14.600 +ligne de téléphone + +02:14.600 --> 02:15.360 +pendant une heure + +02:15.360 --> 02:15.960 +chaque soir pour + +02:15.960 --> 02:16.600 +discuter avec un + +02:16.600 --> 02:16.900 +copain. 
+ +02:17.280 --> 02:17.940 +Mais ça ne + +02:17.940 --> 02:18.980 +ressemblait pas à ce + +02:18.980 --> 02:20.120 +qu'on peut ressentir + +02:20.120 --> 02:21.340 +à voir ce même môme + +02:21.340 --> 02:21.880 +aujourd'hui, + +02:22.140 --> 02:23.180 +continuellement avec + +02:23.180 --> 02:23.940 +son smartphone dans + +02:23.940 --> 02:24.360 +la main, + +02:24.360 --> 02:25.060 +comme si c'était une + +02:25.060 --> 02:25.820 +sorte de pacemaker + +02:25.820 --> 02:26.300 +externe, + +02:26.340 --> 02:27.360 +comme si le lâcher + +02:27.360 --> 02:28.000 +allait entraîner sa + +02:28.000 --> 02:28.840 +mort immédiate. + +02:29.040 --> 02:29.280 +Bon, + +02:29.280 --> 02:29.880 +je dis ça pour le + +02:29.880 --> 02:30.320 +môme, + +02:30.320 --> 02:31.140 +mais c'est évidemment + +02:31.140 --> 02:31.760 +valable pour nous + +02:31.760 --> 02:31.960 +aussi. + +02:32.340 --> 02:33.460 +Donc, + +02:33.460 --> 02:34.240 +rapport inédit. + +02:34.240 --> 02:35.480 +D'accord. + +02:35.480 --> 02:36.680 +Mais pourquoi a-t-on + +02:36.680 --> 02:37.260 +l'impression qu'on + +02:37.260 --> 02:38.220 +n'en sortira jamais? + +02:38.860 --> 02:39.780 +Est-ce qu'il faut en + +02:39.780 --> 02:40.660 +remettre la faute + +02:40.660 --> 02:41.720 +sur les gens qui ont + +02:41.720 --> 02:42.780 +créé cet outil + +02:42.780 --> 02:43.500 +merveilleux et + +02:43.500 --> 02:43.860 +diabolique, + +02:43.860 --> 02:44.660 +et diabolique parce + +02:44.660 --> 02:45.320 +que merveilleux? + +02:46.340 --> 02:47.480 +Les économistes + +02:47.480 --> 02:47.820 +parlent de + +02:47.820 --> 02:48.500 +dépendance du + +02:48.500 --> 02:48.820 +sentier. 
+ +02:48.860 --> 02:49.700 +C'est l'idée qu'on + +02:49.700 --> 02:50.780 +est sur un sentier + +02:50.780 --> 02:51.900 +qui a été établi, + +02:51.900 --> 02:52.720 +soit volontairement + +02:52.720 --> 02:54.240 +en marchant dessus, + +02:54.240 --> 02:55.500 +soit en définissant + +02:55.500 --> 02:56.040 +des bornes, + +02:56.040 --> 02:56.820 +en définissant une + +02:56.820 --> 02:57.420 +signalétique. + diff --git a/tests/expected/split_subtitles/smartphone.mp3_50.srt b/tests/expected/split_subtitles/smartphone.mp3_50.srt new file mode 100644 index 0000000000000000000000000000000000000000..5a9cbd960d9a7073f91c8d0412e7daf0f797d25c --- /dev/null +++ b/tests/expected/split_subtitles/smartphone.mp3_50.srt @@ -0,0 +1,356 @@ +1 +00:00:00,380 --> 00:00:01,780 +C'est évident ce que dit Nicolas, + +2 +00:00:01,780 --> 00:00:03,620 +mais je ne me l'étais jamais formulé comme ça. + +3 +00:00:04,080 --> 00:00:05,880 +Ce qui fait la force du smartphone, + +4 +00:00:05,880 --> 00:00:07,920 +c'est pas seulement l'accumulation des fonctions, + +5 +00:00:08,320 --> 00:00:10,580 +mais la manière dont elles interagissent entre + +6 +00:00:10,580 --> 00:00:10,880 +elles. + +7 +00:00:10,960 --> 00:00:12,120 +Ce qui dit d'ailleurs sur la photo, + +8 +00:00:12,120 --> 00:00:13,000 +c'est hyper convaincant. + +9 +00:00:13,340 --> 00:00:14,340 +Alors évidemment, + +10 +00:00:14,340 --> 00:00:16,020 +il faudrait ajouter les interfaces. + +11 +00:00:16,220 --> 00:00:18,900 +L'écran tactile a été beaucoup très souvent + +12 +00:00:18,900 --> 00:00:19,360 +mentionné. + +13 +00:00:19,840 --> 00:00:20,520 +Mais bon, + +14 +00:00:20,520 --> 00:00:22,480 +il faut dire qu'il profite aussi de 20 ans pendant + +15 +00:00:22,480 --> 00:00:24,500 +lesquels les ordinateurs nous ont appris à cliquer + +16 +00:00:24,500 --> 00:00:25,260 +sur des icônes. 
+ +17 +00:00:25,420 --> 00:00:28,180 +Sauf que le smartphone ajoute le toucher, + +18 +00:00:28,180 --> 00:00:30,640 +ce qui rend le contact plus direct, plus sensible. + +19 +00:00:31,040 --> 00:00:31,700 +Et puis évidemment, + +20 +00:00:31,700 --> 00:00:33,180 +il faudrait parler aussi des applications qui + +21 +00:00:33,180 --> 00:00:35,780 +permettent de contourner le côté touffu de la + +22 +00:00:35,780 --> 00:00:37,820 +navigation web pour aller directement au but. + +23 +00:00:37,820 --> 00:00:39,420 +Bref, tout ça, + +24 +00:00:39,420 --> 00:00:42,380 +ce sont les conditions qui permettent de créer cet + +25 +00:00:42,380 --> 00:00:44,980 +objet dont Nicolas dit qu'il est vraisemblablement + +26 +00:00:44,980 --> 00:00:46,580 +inédit dans l'histoire de l'humanité. + +27 +00:00:46,600 --> 00:00:48,820 +Mais ça, ça soulève une autre interrogation. + +28 +00:00:49,220 --> 00:00:51,800 +Est-ce que le fait que cet objet soit inédit + +29 +00:00:51,800 --> 00:00:54,700 +induit que notre rapport à lui est aussi un + +30 +00:00:54,700 --> 00:00:55,460 +rapport inédit? + +31 +00:00:55,460 --> 00:00:56,240 +Je veux dire, + +32 +00:00:56,240 --> 00:00:57,920 +est-ce que le rapport qu'on a au smartphone est + +33 +00:00:57,920 --> 00:00:59,700 +comparable à celui qu'on entretenait à d'autres + +34 +00:00:59,700 --> 00:01:02,680 +objets techniques comme la voiture ou le + +35 +00:01:02,680 --> 00:01:03,120 +téléphone? + +36 +00:01:03,360 --> 00:01:06,660 +Il n'y a pas d'équivalent en fait. + +37 +00:01:06,880 --> 00:01:09,220 +Et donc cette espèce de nouveauté dans la relation + +38 +00:01:09,220 --> 00:01:11,520 +à l'objet, c'est fascinant et terrifiant. 
+ +39 +00:01:11,620 --> 00:01:13,560 +Parce qu'on a l'impression, + +40 +00:01:13,560 --> 00:01:15,220 +comme le disent les utilisateurs et les services, + +41 +00:01:15,220 --> 00:01:16,480 +d'être dépendants de cet objet, + +42 +00:01:16,860 --> 00:01:18,600 +d'induire en fait une espèce de relation, + +43 +00:01:18,600 --> 00:01:22,020 +de médiation avec le monde qui rend de l'ampleur + +44 +00:01:22,020 --> 00:01:23,260 +et qui amène aussi à des formes de rejet. + +45 +00:01:23,940 --> 00:01:27,800 +Donc, à objet inédit, rapport inédit. + +46 +00:01:28,020 --> 00:01:30,540 +Et ce rapport, si j'en crois Nicolas, + +47 +00:01:30,540 --> 00:01:34,540 +serait caractérisé par un mélange de dépendance et + +48 +00:01:34,540 --> 00:01:35,140 +de rejet. + +49 +00:01:35,780 --> 00:01:37,140 +Bon, en vrai, + +50 +00:01:37,140 --> 00:01:39,700 +il faudrait remonter très très finement toute + +51 +00:01:39,700 --> 00:01:41,840 +l'histoire des objets techniques et de leur + +52 +00:01:41,840 --> 00:01:42,860 +insertion dans nos vies + +53 +00:01:42,900 --> 00:01:45,300 +pour déterminer si ce rapport est totalement + +54 +00:01:45,300 --> 00:01:45,740 +inédit. + +55 +00:01:46,100 --> 00:01:48,700 +Mais j'ai l'impression comme ça que Nicolas ne se + +56 +00:01:48,700 --> 00:01:49,340 +trompe pas vraiment. + +57 +00:01:49,880 --> 00:01:51,140 +Pour autant que je sache, + +58 +00:01:51,140 --> 00:01:53,520 +il y a eu plein de discussions autour de la + +59 +00:01:53,520 --> 00:01:54,980 +voiture ou même du téléphone. + +60 +00:01:55,340 --> 00:01:57,780 +Mais la dépendance n'était pas du même ordre. + +61 +00:01:57,780 --> 00:01:59,840 +Donc le rejet non plus n'était pas du même ordre. + +62 +00:01:59,980 --> 00:02:01,460 +On peut adorer sa bagnole, + +63 +00:02:01,460 --> 00:02:03,020 +en avoir besoin pour plein de choses. + +64 +00:02:03,280 --> 00:02:05,800 +Et bien, le soir, quand on va se coucher, + +65 +00:02:05,800 --> 00:02:06,360 +on la laisse. 
+ +66 +00:02:06,980 --> 00:02:09,140 +On ne l'a pas dans la main quand on est au lit, + +67 +00:02:09,140 --> 00:02:10,480 +on ne l'emmène pas au chiottes. + +68 +00:02:10,860 --> 00:02:13,760 +On pouvait être énervé par son môme qui occupait + +69 +00:02:13,760 --> 00:02:15,540 +la ligne de téléphone pendant une heure chaque + +70 +00:02:15,540 --> 00:02:16,900 +soir pour discuter avec un copain. + +71 +00:02:17,280 --> 00:02:19,480 +Mais ça ne ressemblait pas à ce qu'on peut + +72 +00:02:19,480 --> 00:02:21,880 +ressentir à voir ce même môme aujourd'hui, + +73 +00:02:22,140 --> 00:02:24,360 +continuellement avec son smartphone dans la main, + +74 +00:02:24,360 --> 00:02:26,300 +comme si c'était une sorte de pacemaker externe, + +75 +00:02:26,340 --> 00:02:28,220 +comme si le lâcher allait entraîner sa mort + +76 +00:02:28,220 --> 00:02:28,840 +immédiate. + +77 +00:02:29,040 --> 00:02:30,320 +Bon, je dis ça pour le môme, + +78 +00:02:30,320 --> 00:02:31,960 +mais c'est évidemment valable pour nous aussi. + +79 +00:02:32,340 --> 00:02:35,480 +Donc, rapport inédit. D'accord. + +80 +00:02:35,480 --> 00:02:37,440 +Mais pourquoi a-t-on l'impression qu'on n'en + +81 +00:02:37,440 --> 00:02:38,220 +sortira jamais? + +82 +00:02:38,860 --> 00:02:41,280 +Est-ce qu'il faut en remettre la faute sur les + +83 +00:02:41,280 --> 00:02:43,500 +gens qui ont créé cet outil merveilleux et + +84 +00:02:43,500 --> 00:02:45,320 +diabolique, et diabolique parce que merveilleux? + +85 +00:02:46,340 --> 00:02:48,820 +Les économistes parlent de dépendance du sentier. + +86 +00:02:48,860 --> 00:02:51,120 +C'est l'idée qu'on est sur un sentier qui a été + +87 +00:02:51,120 --> 00:02:54,240 +établi, soit volontairement en marchant dessus, + +88 +00:02:54,240 --> 00:02:56,040 +soit en définissant des bornes, + +89 +00:02:56,040 --> 00:02:57,420 +en définissant une signalétique. 
+ diff --git a/tests/expected/split_subtitles/smartphone.mp3_50.vtt b/tests/expected/split_subtitles/smartphone.mp3_50.vtt new file mode 100644 index 0000000000000000000000000000000000000000..68d9b01306781ba2fcb81166b675053824255222 --- /dev/null +++ b/tests/expected/split_subtitles/smartphone.mp3_50.vtt @@ -0,0 +1,269 @@ +WEBVTT + +00:00.380 --> 00:01.780 +C'est évident ce que dit Nicolas, + +00:01.780 --> 00:03.620 +mais je ne me l'étais jamais formulé comme ça. + +00:04.080 --> 00:05.880 +Ce qui fait la force du smartphone, + +00:05.880 --> 00:07.920 +c'est pas seulement l'accumulation des fonctions, + +00:08.320 --> 00:10.580 +mais la manière dont elles interagissent entre + +00:10.580 --> 00:10.880 +elles. + +00:10.960 --> 00:12.120 +Ce qui dit d'ailleurs sur la photo, + +00:12.120 --> 00:13.000 +c'est hyper convaincant. + +00:13.340 --> 00:14.340 +Alors évidemment, + +00:14.340 --> 00:16.020 +il faudrait ajouter les interfaces. + +00:16.220 --> 00:18.900 +L'écran tactile a été beaucoup très souvent + +00:18.900 --> 00:19.360 +mentionné. + +00:19.840 --> 00:20.520 +Mais bon, + +00:20.520 --> 00:22.480 +il faut dire qu'il profite aussi de 20 ans pendant + +00:22.480 --> 00:24.500 +lesquels les ordinateurs nous ont appris à cliquer + +00:24.500 --> 00:25.260 +sur des icônes. + +00:25.420 --> 00:28.180 +Sauf que le smartphone ajoute le toucher, + +00:28.180 --> 00:30.640 +ce qui rend le contact plus direct, plus sensible. + +00:31.040 --> 00:31.700 +Et puis évidemment, + +00:31.700 --> 00:33.180 +il faudrait parler aussi des applications qui + +00:33.180 --> 00:35.780 +permettent de contourner le côté touffu de la + +00:35.780 --> 00:37.820 +navigation web pour aller directement au but. + +00:37.820 --> 00:39.420 +Bref, tout ça, + +00:39.420 --> 00:42.380 +ce sont les conditions qui permettent de créer cet + +00:42.380 --> 00:44.980 +objet dont Nicolas dit qu'il est vraisemblablement + +00:44.980 --> 00:46.580 +inédit dans l'histoire de l'humanité. 
+ +00:46.600 --> 00:48.820 +Mais ça, ça soulève une autre interrogation. + +00:49.220 --> 00:51.800 +Est-ce que le fait que cet objet soit inédit + +00:51.800 --> 00:54.700 +induit que notre rapport à lui est aussi un + +00:54.700 --> 00:55.460 +rapport inédit? + +00:55.460 --> 00:56.240 +Je veux dire, + +00:56.240 --> 00:57.920 +est-ce que le rapport qu'on a au smartphone est + +00:57.920 --> 00:59.700 +comparable à celui qu'on entretenait à d'autres + +00:59.700 --> 01:02.680 +objets techniques comme la voiture ou le + +01:02.680 --> 01:03.120 +téléphone? + +01:03.360 --> 01:06.660 +Il n'y a pas d'équivalent en fait. + +01:06.880 --> 01:09.220 +Et donc cette espèce de nouveauté dans la relation + +01:09.220 --> 01:11.520 +à l'objet, c'est fascinant et terrifiant. + +01:11.620 --> 01:13.560 +Parce qu'on a l'impression, + +01:13.560 --> 01:15.220 +comme le disent les utilisateurs et les services, + +01:15.220 --> 01:16.480 +d'être dépendants de cet objet, + +01:16.860 --> 01:18.600 +d'induire en fait une espèce de relation, + +01:18.600 --> 01:22.020 +de médiation avec le monde qui rend de l'ampleur + +01:22.020 --> 01:23.260 +et qui amène aussi à des formes de rejet. + +01:23.940 --> 01:27.800 +Donc, à objet inédit, rapport inédit. + +01:28.020 --> 01:30.540 +Et ce rapport, si j'en crois Nicolas, + +01:30.540 --> 01:34.540 +serait caractérisé par un mélange de dépendance et + +01:34.540 --> 01:35.140 +de rejet. + +01:35.780 --> 01:37.140 +Bon, en vrai, + +01:37.140 --> 01:39.700 +il faudrait remonter très très finement toute + +01:39.700 --> 01:41.840 +l'histoire des objets techniques et de leur + +01:41.840 --> 01:42.860 +insertion dans nos vies + +01:42.900 --> 01:45.300 +pour déterminer si ce rapport est totalement + +01:45.300 --> 01:45.740 +inédit. + +01:46.100 --> 01:48.700 +Mais j'ai l'impression comme ça que Nicolas ne se + +01:48.700 --> 01:49.340 +trompe pas vraiment. 
+ +01:49.880 --> 01:51.140 +Pour autant que je sache, + +01:51.140 --> 01:53.520 +il y a eu plein de discussions autour de la + +01:53.520 --> 01:54.980 +voiture ou même du téléphone. + +01:55.340 --> 01:57.780 +Mais la dépendance n'était pas du même ordre. + +01:57.780 --> 01:59.840 +Donc le rejet non plus n'était pas du même ordre. + +01:59.980 --> 02:01.460 +On peut adorer sa bagnole, + +02:01.460 --> 02:03.020 +en avoir besoin pour plein de choses. + +02:03.280 --> 02:05.800 +Et bien, le soir, quand on va se coucher, + +02:05.800 --> 02:06.360 +on la laisse. + +02:06.980 --> 02:09.140 +On ne l'a pas dans la main quand on est au lit, + +02:09.140 --> 02:10.480 +on ne l'emmène pas au chiottes. + +02:10.860 --> 02:13.760 +On pouvait être énervé par son môme qui occupait + +02:13.760 --> 02:15.540 +la ligne de téléphone pendant une heure chaque + +02:15.540 --> 02:16.900 +soir pour discuter avec un copain. + +02:17.280 --> 02:19.480 +Mais ça ne ressemblait pas à ce qu'on peut + +02:19.480 --> 02:21.880 +ressentir à voir ce même môme aujourd'hui, + +02:22.140 --> 02:24.360 +continuellement avec son smartphone dans la main, + +02:24.360 --> 02:26.300 +comme si c'était une sorte de pacemaker externe, + +02:26.340 --> 02:28.220 +comme si le lâcher allait entraîner sa mort + +02:28.220 --> 02:28.840 +immédiate. + +02:29.040 --> 02:30.320 +Bon, je dis ça pour le môme, + +02:30.320 --> 02:31.960 +mais c'est évidemment valable pour nous aussi. + +02:32.340 --> 02:35.480 +Donc, rapport inédit. D'accord. + +02:35.480 --> 02:37.440 +Mais pourquoi a-t-on l'impression qu'on n'en + +02:37.440 --> 02:38.220 +sortira jamais? + +02:38.860 --> 02:41.280 +Est-ce qu'il faut en remettre la faute sur les + +02:41.280 --> 02:43.500 +gens qui ont créé cet outil merveilleux et + +02:43.500 --> 02:45.320 +diabolique, et diabolique parce que merveilleux? + +02:46.340 --> 02:48.820 +Les économistes parlent de dépendance du sentier. 
+ +02:48.860 --> 02:51.120 +C'est l'idée qu'on est sur un sentier qui a été + +02:51.120 --> 02:54.240 +établi, soit volontairement en marchant dessus, + +02:54.240 --> 02:56.040 +soit en définissant des bornes, + +02:56.040 --> 02:57.420 +en définissant une signalétique. + diff --git a/tests/expected/split_subtitles/smartphone.mp3_6.srt b/tests/expected/split_subtitles/smartphone.mp3_6.srt new file mode 100644 index 0000000000000000000000000000000000000000..e03246f80d846a479b5404c598c34d50b8266e96 --- /dev/null +++ b/tests/expected/split_subtitles/smartphone.mp3_6.srt @@ -0,0 +1,2024 @@ +1 +00:00:00,380 --> 00:00:00,580 +C'est + +2 +00:00:00,580 --> 00:00:00,880 +évident + +3 +00:00:00,880 --> 00:00:01,080 +ce que + +4 +00:00:01,080 --> 00:00:01,200 +dit + +5 +00:00:01,200 --> 00:00:01,780 +Nicolas, + +6 +00:00:01,780 --> 00:00:01,900 +mais + +7 +00:00:01,900 --> 00:00:02,340 +je ne + +8 +00:00:02,340 --> 00:00:02,380 +me + +9 +00:00:02,380 --> 00:00:02,580 +l'étais + +10 +00:00:02,580 --> 00:00:02,840 +jamais + +11 +00:00:02,840 --> 00:00:03,260 +formulé + +12 +00:00:03,260 --> 00:00:03,420 +comme + +13 +00:00:03,420 --> 00:00:03,620 +ça. 
+ +14 +00:00:04,080 --> 00:00:04,340 +Ce qui + +15 +00:00:04,340 --> 00:00:04,480 +fait + +16 +00:00:04,480 --> 00:00:04,660 +la + +17 +00:00:04,660 --> 00:00:05,000 +force + +18 +00:00:05,000 --> 00:00:05,200 +du + +19 +00:00:05,200 --> 00:00:05,880 +smartphone, + +20 +00:00:05,880 --> 00:00:06,120 +c'est + +21 +00:00:06,120 --> 00:00:06,260 +pas + +22 +00:00:06,260 --> 00:00:06,520 +seulement + +23 +00:00:06,520 --> 00:00:07,380 +l'accumulation + +24 +00:00:07,380 --> 00:00:07,560 +des + +25 +00:00:07,560 --> 00:00:07,920 +fonctions, + +26 +00:00:08,320 --> 00:00:08,440 +mais + +27 +00:00:08,440 --> 00:00:08,600 +la + +28 +00:00:08,600 --> 00:00:08,900 +manière + +29 +00:00:08,900 --> 00:00:09,100 +dont + +30 +00:00:09,100 --> 00:00:09,480 +elles + +31 +00:00:09,480 --> 00:00:10,320 +interagissent + +32 +00:00:10,320 --> 00:00:10,580 +entre + +33 +00:00:10,580 --> 00:00:10,880 +elles. + +34 +00:00:10,960 --> 00:00:11,220 +Ce qui + +35 +00:00:11,220 --> 00:00:11,400 +dit + +36 +00:00:11,400 --> 00:00:11,560 +d'ailleurs + +37 +00:00:11,560 --> 00:00:11,780 +sur la + +38 +00:00:11,780 --> 00:00:12,120 +photo, + +39 +00:00:12,120 --> 00:00:12,200 +c'est + +40 +00:00:12,200 --> 00:00:12,420 +hyper + +41 +00:00:12,420 --> 00:00:13,000 +convaincant. + +42 +00:00:13,340 --> 00:00:13,620 +Alors + +43 +00:00:13,620 --> 00:00:14,340 +évidemment, + +44 +00:00:14,340 --> 00:00:14,380 +il + +45 +00:00:14,380 --> 00:00:14,740 +faudrait + +46 +00:00:14,740 --> 00:00:15,160 +ajouter + +47 +00:00:15,160 --> 00:00:15,520 +les + +48 +00:00:15,520 --> 00:00:16,020 +interfaces. + +49 +00:00:16,220 --> 00:00:16,700 +L'écran + +50 +00:00:16,700 --> 00:00:17,060 +tactile + +51 +00:00:17,060 --> 00:00:17,880 +a été + +52 +00:00:17,880 --> 00:00:18,280 +beaucoup + +53 +00:00:18,280 --> 00:00:18,620 +très + +54 +00:00:18,620 --> 00:00:18,900 +souvent + +55 +00:00:18,900 --> 00:00:19,360 +mentionné. 
+ +56 +00:00:19,840 --> 00:00:20,220 +Mais + +57 +00:00:20,220 --> 00:00:20,520 +bon, + +58 +00:00:20,520 --> 00:00:20,600 +il + +59 +00:00:20,600 --> 00:00:20,700 +faut + +60 +00:00:20,700 --> 00:00:20,840 +dire + +61 +00:00:20,840 --> 00:00:20,960 +qu'il + +62 +00:00:20,960 --> 00:00:21,260 +profite + +63 +00:00:21,260 --> 00:00:21,680 +aussi + +64 +00:00:21,680 --> 00:00:22,100 +de 20 + +65 +00:00:22,100 --> 00:00:22,320 +ans + +66 +00:00:22,320 --> 00:00:22,480 +pendant + +67 +00:00:22,480 --> 00:00:22,920 +lesquels + +68 +00:00:22,920 --> 00:00:23,040 +les + +69 +00:00:23,040 --> 00:00:23,540 +ordinateurs + +70 +00:00:23,540 --> 00:00:23,720 +nous + +71 +00:00:23,720 --> 00:00:23,820 +ont + +72 +00:00:23,820 --> 00:00:24,100 +appris + +73 +00:00:24,100 --> 00:00:24,240 +à + +74 +00:00:24,240 --> 00:00:24,500 +cliquer + +75 +00:00:24,500 --> 00:00:24,660 +sur + +76 +00:00:24,660 --> 00:00:24,940 +des + +77 +00:00:24,940 --> 00:00:25,260 +icônes. + +78 +00:00:25,420 --> 00:00:25,760 +Sauf + +79 +00:00:25,760 --> 00:00:26,660 +que le + +80 +00:00:26,660 --> 00:00:27,060 +smartphone + +81 +00:00:27,060 --> 00:00:27,440 +ajoute + +82 +00:00:27,440 --> 00:00:27,620 +le + +83 +00:00:27,620 --> 00:00:28,180 +toucher, + +84 +00:00:28,180 --> 00:00:28,280 +ce qui + +85 +00:00:28,280 --> 00:00:28,480 +rend + +86 +00:00:28,480 --> 00:00:28,680 +le + +87 +00:00:28,680 --> 00:00:29,100 +contact + +88 +00:00:29,100 --> 00:00:29,460 +plus + +89 +00:00:29,460 --> 00:00:30,220 +direct, + +90 +00:00:30,220 --> 00:00:30,260 +plus + +91 +00:00:30,260 --> 00:00:30,640 +sensible. 
+ +92 +00:00:31,040 --> 00:00:31,220 +Et + +93 +00:00:31,220 --> 00:00:31,360 +puis + +94 +00:00:31,360 --> 00:00:31,700 +évidemment, + +95 +00:00:31,700 --> 00:00:31,740 +il + +96 +00:00:31,740 --> 00:00:31,940 +faudrait + +97 +00:00:31,940 --> 00:00:32,120 +parler + +98 +00:00:32,120 --> 00:00:32,340 +aussi + +99 +00:00:32,340 --> 00:00:32,480 +des + +100 +00:00:32,480 --> 00:00:32,900 +applications + +101 +00:00:32,900 --> 00:00:33,180 +qui + +102 +00:00:33,180 --> 00:00:33,740 +permettent + +103 +00:00:33,740 --> 00:00:33,960 +de + +104 +00:00:33,960 --> 00:00:34,420 +contourner + +105 +00:00:34,420 --> 00:00:34,520 +le + +106 +00:00:34,520 --> 00:00:34,800 +côté + +107 +00:00:34,800 --> 00:00:35,320 +touffu + +108 +00:00:35,320 --> 00:00:35,780 +de la + +109 +00:00:35,780 --> 00:00:36,240 +navigation + +110 +00:00:36,240 --> 00:00:36,600 +web + +111 +00:00:36,600 --> 00:00:36,780 +pour + +112 +00:00:36,780 --> 00:00:36,980 +aller + +113 +00:00:36,980 --> 00:00:37,520 +directement + +114 +00:00:37,520 --> 00:00:37,680 +au + +115 +00:00:37,680 --> 00:00:37,820 +but. 
+ +116 +00:00:37,820 --> 00:00:38,760 +Bref, + +117 +00:00:38,760 --> 00:00:38,980 +tout + +118 +00:00:38,980 --> 00:00:39,420 +ça, + +119 +00:00:39,420 --> 00:00:39,880 +ce sont + +120 +00:00:39,880 --> 00:00:40,160 +les + +121 +00:00:40,160 --> 00:00:40,680 +conditions + +122 +00:00:40,680 --> 00:00:40,960 +qui + +123 +00:00:40,960 --> 00:00:41,460 +permettent + +124 +00:00:41,460 --> 00:00:41,600 +de + +125 +00:00:41,600 --> 00:00:42,060 +créer + +126 +00:00:42,060 --> 00:00:42,380 +cet + +127 +00:00:42,380 --> 00:00:42,600 +objet + +128 +00:00:42,600 --> 00:00:42,800 +dont + +129 +00:00:42,800 --> 00:00:43,260 +Nicolas + +130 +00:00:43,260 --> 00:00:43,500 +dit + +131 +00:00:43,500 --> 00:00:43,700 +qu'il + +132 +00:00:43,700 --> 00:00:43,880 +est + +133 +00:00:43,880 --> 00:00:44,980 +vraisemblablement + +134 +00:00:44,980 --> 00:00:45,380 +inédit + +135 +00:00:45,380 --> 00:00:45,700 +dans + +136 +00:00:45,700 --> 00:00:45,980 +l'histoire + +137 +00:00:45,980 --> 00:00:46,180 +de + +138 +00:00:46,180 --> 00:00:46,580 +l'humanité. + +139 +00:00:46,600 --> 00:00:47,240 +Mais + +140 +00:00:47,240 --> 00:00:47,720 +ça, + +141 +00:00:47,720 --> 00:00:47,840 +ça soulève + +142 +00:00:47,840 --> 00:00:48,020 +une + +143 +00:00:48,020 --> 00:00:48,260 +autre + +144 +00:00:48,260 --> 00:00:48,820 +interrogation. 
+ +145 +00:00:49,220 --> 00:00:49,620 +Est-ce + +146 +00:00:49,620 --> 00:00:49,820 +que le + +147 +00:00:49,820 --> 00:00:49,980 +fait + +148 +00:00:49,980 --> 00:00:50,140 +que + +149 +00:00:50,140 --> 00:00:50,320 +cet + +150 +00:00:50,320 --> 00:00:50,660 +objet + +151 +00:00:50,660 --> 00:00:51,120 +soit + +152 +00:00:51,120 --> 00:00:51,800 +inédit + +153 +00:00:51,800 --> 00:00:52,320 +induit + +154 +00:00:52,320 --> 00:00:52,420 +que + +155 +00:00:52,420 --> 00:00:52,720 +notre + +156 +00:00:52,720 --> 00:00:53,280 +rapport + +157 +00:00:53,280 --> 00:00:53,660 +à lui + +158 +00:00:53,660 --> 00:00:54,020 +est + +159 +00:00:54,020 --> 00:00:54,540 +aussi + +160 +00:00:54,540 --> 00:00:54,700 +un + +161 +00:00:54,700 --> 00:00:55,000 +rapport + +162 +00:00:55,000 --> 00:00:55,460 +inédit? + +163 +00:00:55,460 --> 00:00:55,900 +Je + +164 +00:00:55,900 --> 00:00:56,000 +veux + +165 +00:00:56,000 --> 00:00:56,240 +dire, + +166 +00:00:56,240 --> 00:00:56,360 +est-ce + +167 +00:00:56,360 --> 00:00:56,580 +que le + +168 +00:00:56,580 --> 00:00:56,880 +rapport + +169 +00:00:56,880 --> 00:00:57,040 +qu'on + +170 +00:00:57,040 --> 00:00:57,280 +a au + +171 +00:00:57,280 --> 00:00:57,600 +smartphone + +172 +00:00:57,600 --> 00:00:57,920 +est + +173 +00:00:57,920 --> 00:00:58,240 +comparable + +174 +00:00:58,240 --> 00:00:58,480 +à + +175 +00:00:58,480 --> 00:00:58,660 +celui + +176 +00:00:58,660 --> 00:00:58,900 +qu'on + +177 +00:00:58,900 --> 00:00:59,320 +entretenait + +178 +00:00:59,320 --> 00:00:59,460 +à + +179 +00:00:59,460 --> 00:00:59,700 +d'autres + +180 +00:00:59,700 --> 00:00:59,960 +objets + +181 +00:00:59,960 --> 00:01:00,460 +techniques + +182 +00:01:00,460 --> 00:01:00,880 +comme + +183 +00:01:00,880 --> 00:01:01,500 +la + +184 +00:01:01,500 --> 00:01:02,060 +voiture + +185 +00:01:02,060 --> 00:01:02,680 +ou le + +186 +00:01:02,680 --> 00:01:03,120 +téléphone? 
+ +187 +00:01:03,360 --> 00:01:05,480 +Il n'y + +188 +00:01:05,480 --> 00:01:05,660 +a pas + +189 +00:01:05,660 --> 00:01:06,220 +d'équivalent + +190 +00:01:06,220 --> 00:01:06,420 +en + +191 +00:01:06,420 --> 00:01:06,660 +fait. + +192 +00:01:06,880 --> 00:01:06,980 +Et + +193 +00:01:06,980 --> 00:01:07,080 +donc + +194 +00:01:07,080 --> 00:01:07,280 +cette + +195 +00:01:07,280 --> 00:01:07,540 +espèce + +196 +00:01:07,540 --> 00:01:07,680 +de + +197 +00:01:07,680 --> 00:01:08,480 +nouveauté + +198 +00:01:08,480 --> 00:01:08,660 +dans + +199 +00:01:08,660 --> 00:01:08,940 +la + +200 +00:01:08,940 --> 00:01:09,220 +relation + +201 +00:01:09,220 --> 00:01:09,380 +à + +202 +00:01:09,380 --> 00:01:10,240 +l'objet, + +203 +00:01:10,240 --> 00:01:10,380 +c'est + +204 +00:01:10,380 --> 00:01:10,640 +fascinant + +205 +00:01:10,640 --> 00:01:10,760 +et + +206 +00:01:10,760 --> 00:01:11,520 +terrifiant. + +207 +00:01:11,620 --> 00:01:11,860 +Parce + +208 +00:01:11,860 --> 00:01:12,120 +qu'on + +209 +00:01:12,120 --> 00:01:12,440 +a + +210 +00:01:12,440 --> 00:01:13,560 +l'impression, + +211 +00:01:13,560 --> 00:01:13,840 +comme + +212 +00:01:13,840 --> 00:01:14,000 +le + +213 +00:01:14,000 --> 00:01:14,200 +disent + +214 +00:01:14,200 --> 00:01:14,400 +les + +215 +00:01:14,400 --> 00:01:14,840 +utilisateurs + +216 +00:01:14,840 --> 00:01:15,000 +et les + +217 +00:01:15,000 --> 00:01:15,220 +services, + +218 +00:01:15,220 --> 00:01:15,420 +d'être + +219 +00:01:15,420 --> 00:01:15,960 +dépendants + +220 +00:01:15,960 --> 00:01:16,260 +de cet + +221 +00:01:16,260 --> 00:01:16,480 +objet, + +222 +00:01:16,860 --> 00:01:17,080 +d'induire + +223 +00:01:17,080 --> 00:01:17,240 +en + +224 +00:01:17,240 --> 00:01:17,340 +fait + +225 +00:01:17,340 --> 00:01:17,520 +une + +226 +00:01:17,520 --> 00:01:17,880 +espèce + +227 +00:01:17,880 --> 00:01:18,480 +de + +228 +00:01:18,480 --> 00:01:18,600 +relation, + +229 +00:01:18,600 --> 00:01:18,940 +de + +230 +00:01:18,940 --> 00:01:19,520 
+médiation + +231 +00:01:19,520 --> 00:01:19,740 +avec + +232 +00:01:19,740 --> 00:01:19,920 +le + +233 +00:01:19,920 --> 00:01:20,640 +monde + +234 +00:01:20,640 --> 00:01:21,100 +qui + +235 +00:01:21,100 --> 00:01:21,640 +rend + +236 +00:01:21,640 --> 00:01:21,780 +de + +237 +00:01:21,780 --> 00:01:22,020 +l'ampleur + +238 +00:01:22,020 --> 00:01:22,240 +et qui + +239 +00:01:22,240 --> 00:01:22,360 +amène + +240 +00:01:22,360 --> 00:01:22,560 +aussi + +241 +00:01:22,560 --> 00:01:22,720 +à des + +242 +00:01:22,720 --> 00:01:22,900 +formes + +243 +00:01:22,900 --> 00:01:23,020 +de + +244 +00:01:23,020 --> 00:01:23,260 +rejet. + +245 +00:01:23,940 --> 00:01:24,940 +Donc, + +246 +00:01:24,940 --> 00:01:24,980 +à + +247 +00:01:24,980 --> 00:01:25,360 +objet + +248 +00:01:25,360 --> 00:01:26,560 +inédit, + +249 +00:01:26,560 --> 00:01:27,000 +rapport + +250 +00:01:27,000 --> 00:01:27,800 +inédit. + +251 +00:01:28,020 --> 00:01:28,860 +Et ce + +252 +00:01:28,860 --> 00:01:29,280 +rapport, + +253 +00:01:29,280 --> 00:01:29,560 +si + +254 +00:01:29,560 --> 00:01:29,840 +j'en + +255 +00:01:29,840 --> 00:01:29,880 +crois + +256 +00:01:29,880 --> 00:01:30,540 +Nicolas, + +257 +00:01:30,540 --> 00:01:30,940 +serait + +258 +00:01:30,940 --> 00:01:31,800 +caractérisé + +259 +00:01:31,800 --> 00:01:32,440 +par un + +260 +00:01:32,440 --> 00:01:32,980 +mélange + +261 +00:01:32,980 --> 00:01:33,400 +de + +262 +00:01:33,400 --> 00:01:34,240 +dépendance + +263 +00:01:34,240 --> 00:01:34,680 +et de + +264 +00:01:34,680 --> 00:01:35,140 +rejet. 
+ +265 +00:01:35,780 --> 00:01:36,380 +Bon, + +266 +00:01:36,380 --> 00:01:36,520 +en + +267 +00:01:36,520 --> 00:01:37,140 +vrai, + +268 +00:01:37,140 --> 00:01:37,180 +il + +269 +00:01:37,180 --> 00:01:37,580 +faudrait + +270 +00:01:37,580 --> 00:01:38,080 +remonter + +271 +00:01:38,080 --> 00:01:38,580 +très + +272 +00:01:38,580 --> 00:01:38,700 +très + +273 +00:01:38,700 --> 00:01:39,320 +finement + +274 +00:01:39,320 --> 00:01:39,700 +toute + +275 +00:01:39,700 --> 00:01:40,060 +l'histoire + +276 +00:01:40,060 --> 00:01:40,240 +des + +277 +00:01:40,240 --> 00:01:40,480 +objets + +278 +00:01:40,480 --> 00:01:41,020 +techniques + +279 +00:01:41,020 --> 00:01:41,680 +et de + +280 +00:01:41,680 --> 00:01:41,840 +leur + +281 +00:01:41,840 --> 00:01:42,320 +insertion + +282 +00:01:42,320 --> 00:01:42,480 +dans + +283 +00:01:42,480 --> 00:01:42,660 +nos + +284 +00:01:42,660 --> 00:01:42,860 +vies + +285 +00:01:42,900 --> 00:01:43,060 +pour + +286 +00:01:43,060 --> 00:01:43,660 +déterminer + +287 +00:01:43,660 --> 00:01:43,940 +si ce + +288 +00:01:43,940 --> 00:01:44,260 +rapport + +289 +00:01:44,260 --> 00:01:44,740 +est + +290 +00:01:44,740 --> 00:01:45,300 +totalement + +291 +00:01:45,300 --> 00:01:45,740 +inédit. + +292 +00:01:46,100 --> 00:01:46,360 +Mais + +293 +00:01:46,360 --> 00:01:46,920 +j'ai + +294 +00:01:46,920 --> 00:01:47,360 +l'impression + +295 +00:01:47,360 --> 00:01:47,560 +comme + +296 +00:01:47,560 --> 00:01:47,960 +ça que + +297 +00:01:47,960 --> 00:01:48,460 +Nicolas + +298 +00:01:48,460 --> 00:01:48,700 +ne se + +299 +00:01:48,700 --> 00:01:48,880 +trompe + +300 +00:01:48,880 --> 00:01:49,080 +pas + +301 +00:01:49,080 --> 00:01:49,340 +vraiment. 
+ +302 +00:01:49,880 --> 00:01:50,080 +Pour + +303 +00:01:50,080 --> 00:01:50,240 +autant + +304 +00:01:50,240 --> 00:01:50,520 +que je + +305 +00:01:50,520 --> 00:01:51,140 +sache, + +306 +00:01:51,140 --> 00:01:51,360 +il y a + +307 +00:01:51,360 --> 00:01:51,680 +eu + +308 +00:01:51,680 --> 00:01:51,880 +plein + +309 +00:01:51,880 --> 00:01:52,060 +de + +310 +00:01:52,060 --> 00:01:52,600 +discussions + +311 +00:01:52,600 --> 00:01:52,940 +autour + +312 +00:01:52,940 --> 00:01:53,520 +de la + +313 +00:01:53,520 --> 00:01:53,860 +voiture + +314 +00:01:53,860 --> 00:01:54,060 +ou + +315 +00:01:54,060 --> 00:01:54,440 +même + +316 +00:01:54,440 --> 00:01:54,600 +du + +317 +00:01:54,600 --> 00:01:54,980 +téléphone. + +318 +00:01:55,340 --> 00:01:55,720 +Mais + +319 +00:01:55,720 --> 00:01:56,020 +la + +320 +00:01:56,020 --> 00:01:56,400 +dépendance + +321 +00:01:56,400 --> 00:01:56,620 +n'était + +322 +00:01:56,620 --> 00:01:57,160 +pas du + +323 +00:01:57,160 --> 00:01:57,460 +même + +324 +00:01:57,460 --> 00:01:57,780 +ordre. + +325 +00:01:57,780 --> 00:01:57,980 +Donc + +326 +00:01:57,980 --> 00:01:58,340 +le + +327 +00:01:58,340 --> 00:01:58,620 +rejet + +328 +00:01:58,620 --> 00:01:58,780 +non + +329 +00:01:58,780 --> 00:01:58,940 +plus + +330 +00:01:58,940 --> 00:01:59,120 +n'était + +331 +00:01:59,120 --> 00:01:59,380 +pas du + +332 +00:01:59,380 --> 00:01:59,560 +même + +333 +00:01:59,560 --> 00:01:59,840 +ordre. + +334 +00:01:59,980 --> 00:02:00,180 +On + +335 +00:02:00,180 --> 00:02:00,380 +peut + +336 +00:02:00,380 --> 00:02:00,660 +adorer + +337 +00:02:00,660 --> 00:02:00,880 +sa + +338 +00:02:00,880 --> 00:02:01,460 +bagnole, + +339 +00:02:01,460 --> 00:02:01,560 +en + +340 +00:02:01,560 --> 00:02:01,740 +avoir + +341 +00:02:01,740 --> 00:02:02,100 +besoin + +342 +00:02:02,100 --> 00:02:02,340 +pour + +343 +00:02:02,340 --> 00:02:02,680 +plein + +344 +00:02:02,680 --> 00:02:02,800 +de + +345 +00:02:02,800 --> 00:02:03,020 +choses. 
+ +346 +00:02:03,280 --> 00:02:03,460 +Et + +347 +00:02:03,460 --> 00:02:03,860 +bien, + +348 +00:02:03,860 --> 00:02:03,980 +le + +349 +00:02:03,980 --> 00:02:04,680 +soir, + +350 +00:02:04,680 --> 00:02:04,900 +quand + +351 +00:02:04,900 --> 00:02:05,140 +on va + +352 +00:02:05,140 --> 00:02:05,380 +se + +353 +00:02:05,380 --> 00:02:05,800 +coucher, + +354 +00:02:05,800 --> 00:02:06,220 +on la + +355 +00:02:06,220 --> 00:02:06,360 +laisse. + +356 +00:02:06,980 --> 00:02:07,360 +On ne + +357 +00:02:07,360 --> 00:02:07,480 +l'a + +358 +00:02:07,480 --> 00:02:07,680 +pas + +359 +00:02:07,680 --> 00:02:07,800 +dans + +360 +00:02:07,800 --> 00:02:08,060 +la + +361 +00:02:08,060 --> 00:02:08,260 +main + +362 +00:02:08,260 --> 00:02:08,440 +quand + +363 +00:02:08,440 --> 00:02:08,680 +on est + +364 +00:02:08,680 --> 00:02:09,040 +au + +365 +00:02:09,040 --> 00:02:09,140 +lit, + +366 +00:02:09,140 --> 00:02:09,300 +on ne + +367 +00:02:09,300 --> 00:02:09,500 +l'emmène + +368 +00:02:09,500 --> 00:02:09,860 +pas au + +369 +00:02:09,860 --> 00:02:10,480 +chiottes. 
+ +370 +00:02:10,860 --> 00:02:11,040 +On + +371 +00:02:11,040 --> 00:02:11,280 +pouvait + +372 +00:02:11,280 --> 00:02:11,480 +être + +373 +00:02:11,480 --> 00:02:12,220 +énervé + +374 +00:02:12,220 --> 00:02:12,440 +par + +375 +00:02:12,440 --> 00:02:12,700 +son + +376 +00:02:12,700 --> 00:02:13,100 +môme + +377 +00:02:13,100 --> 00:02:13,340 +qui + +378 +00:02:13,340 --> 00:02:13,760 +occupait + +379 +00:02:13,760 --> 00:02:13,800 +la + +380 +00:02:13,800 --> 00:02:14,080 +ligne + +381 +00:02:14,080 --> 00:02:14,140 +de + +382 +00:02:14,140 --> 00:02:14,600 +téléphone + +383 +00:02:14,600 --> 00:02:14,820 +pendant + +384 +00:02:14,820 --> 00:02:15,200 +une + +385 +00:02:15,200 --> 00:02:15,360 +heure + +386 +00:02:15,360 --> 00:02:15,540 +chaque + +387 +00:02:15,540 --> 00:02:15,800 +soir + +388 +00:02:15,800 --> 00:02:15,960 +pour + +389 +00:02:15,960 --> 00:02:16,280 +discuter + +390 +00:02:16,280 --> 00:02:16,480 +avec + +391 +00:02:16,480 --> 00:02:16,600 +un + +392 +00:02:16,600 --> 00:02:16,900 +copain. 
+ +393 +00:02:17,280 --> 00:02:17,460 +Mais + +394 +00:02:17,460 --> 00:02:17,940 +ça ne + +395 +00:02:17,940 --> 00:02:18,400 +ressemblait + +396 +00:02:18,400 --> 00:02:18,940 +pas à + +397 +00:02:18,940 --> 00:02:18,980 +ce + +398 +00:02:18,980 --> 00:02:19,100 +qu'on + +399 +00:02:19,100 --> 00:02:19,480 +peut + +400 +00:02:19,480 --> 00:02:20,120 +ressentir + +401 +00:02:20,120 --> 00:02:20,460 +à voir + +402 +00:02:20,460 --> 00:02:20,680 +ce + +403 +00:02:20,680 --> 00:02:20,920 +même + +404 +00:02:20,920 --> 00:02:21,340 +môme + +405 +00:02:21,340 --> 00:02:21,880 +aujourd'hui, + +406 +00:02:22,140 --> 00:02:22,940 +continuellement + +407 +00:02:22,940 --> 00:02:23,180 +avec + +408 +00:02:23,180 --> 00:02:23,380 +son + +409 +00:02:23,380 --> 00:02:23,760 +smartphone + +410 +00:02:23,760 --> 00:02:23,940 +dans + +411 +00:02:23,940 --> 00:02:24,000 +la + +412 +00:02:24,000 --> 00:02:24,360 +main, + +413 +00:02:24,360 --> 00:02:24,520 +comme + +414 +00:02:24,520 --> 00:02:24,640 +si + +415 +00:02:24,640 --> 00:02:24,820 +c'était + +416 +00:02:24,820 --> 00:02:25,060 +une + +417 +00:02:25,060 --> 00:02:25,220 +sorte + +418 +00:02:25,220 --> 00:02:25,300 +de + +419 +00:02:25,300 --> 00:02:25,820 +pacemaker + +420 +00:02:25,820 --> 00:02:26,300 +externe, + +421 +00:02:26,340 --> 00:02:26,580 +comme + +422 +00:02:26,580 --> 00:02:26,860 +si le + +423 +00:02:26,860 --> 00:02:27,360 +lâcher + +424 +00:02:27,360 --> 00:02:27,560 +allait + +425 +00:02:27,560 --> 00:02:27,860 +entraîner + +426 +00:02:27,860 --> 00:02:28,000 +sa + +427 +00:02:28,000 --> 00:02:28,220 +mort + +428 +00:02:28,220 --> 00:02:28,840 +immédiate. 
+ +429 +00:02:29,040 --> 00:02:29,280 +Bon, + +430 +00:02:29,280 --> 00:02:29,460 +je dis + +431 +00:02:29,460 --> 00:02:29,640 +ça + +432 +00:02:29,640 --> 00:02:29,740 +pour + +433 +00:02:29,740 --> 00:02:29,880 +le + +434 +00:02:29,880 --> 00:02:30,320 +môme, + +435 +00:02:30,320 --> 00:02:30,520 +mais + +436 +00:02:30,520 --> 00:02:30,820 +c'est + +437 +00:02:30,820 --> 00:02:31,140 +évidemment + +438 +00:02:31,140 --> 00:02:31,480 +valable + +439 +00:02:31,480 --> 00:02:31,620 +pour + +440 +00:02:31,620 --> 00:02:31,760 +nous + +441 +00:02:31,760 --> 00:02:31,960 +aussi. + +442 +00:02:32,340 --> 00:02:33,460 +Donc, + +443 +00:02:33,460 --> 00:02:33,660 +rapport + +444 +00:02:33,660 --> 00:02:34,240 +inédit. + +445 +00:02:34,240 --> 00:02:35,480 +D'accord. + +446 +00:02:35,480 --> 00:02:35,820 +Mais + +447 +00:02:35,820 --> 00:02:36,320 +pourquoi + +448 +00:02:36,320 --> 00:02:36,680 +a-t-on + +449 +00:02:36,680 --> 00:02:37,060 +l'impression + +450 +00:02:37,060 --> 00:02:37,260 +qu'on + +451 +00:02:37,260 --> 00:02:37,440 +n'en + +452 +00:02:37,440 --> 00:02:37,900 +sortira + +453 +00:02:37,900 --> 00:02:38,220 +jamais? 
+ +454 +00:02:38,860 --> 00:02:39,340 +Est-ce + +455 +00:02:39,340 --> 00:02:39,460 +qu'il + +456 +00:02:39,460 --> 00:02:39,620 +faut + +457 +00:02:39,620 --> 00:02:39,780 +en + +458 +00:02:39,780 --> 00:02:40,120 +remettre + +459 +00:02:40,120 --> 00:02:40,340 +la + +460 +00:02:40,340 --> 00:02:40,660 +faute + +461 +00:02:40,660 --> 00:02:40,940 +sur + +462 +00:02:40,940 --> 00:02:41,280 +les + +463 +00:02:41,280 --> 00:02:41,440 +gens + +464 +00:02:41,440 --> 00:02:41,580 +qui + +465 +00:02:41,580 --> 00:02:41,720 +ont + +466 +00:02:41,720 --> 00:02:42,300 +créé + +467 +00:02:42,300 --> 00:02:42,460 +cet + +468 +00:02:42,460 --> 00:02:42,780 +outil + +469 +00:02:42,780 --> 00:02:43,340 +merveilleux + +470 +00:02:43,340 --> 00:02:43,500 +et + +471 +00:02:43,500 --> 00:02:43,860 +diabolique, + +472 +00:02:43,860 --> 00:02:43,920 +et + +473 +00:02:43,920 --> 00:02:44,400 +diabolique + +474 +00:02:44,400 --> 00:02:44,660 +parce + +475 +00:02:44,660 --> 00:02:44,840 +que + +476 +00:02:44,840 --> 00:02:45,320 +merveilleux? + +477 +00:02:46,340 --> 00:02:47,040 +Les + +478 +00:02:47,040 --> 00:02:47,480 +économistes + +479 +00:02:47,480 --> 00:02:47,680 +parlent + +480 +00:02:47,680 --> 00:02:47,820 +de + +481 +00:02:47,820 --> 00:02:48,360 +dépendance + +482 +00:02:48,360 --> 00:02:48,500 +du + +483 +00:02:48,500 --> 00:02:48,820 +sentier. 
+ +484 +00:02:48,860 --> 00:02:49,100 +C'est + +485 +00:02:49,100 --> 00:02:49,340 +l'idée + +486 +00:02:49,340 --> 00:02:49,700 +qu'on + +487 +00:02:49,700 --> 00:02:49,880 +est + +488 +00:02:49,880 --> 00:02:50,540 +sur un + +489 +00:02:50,540 --> 00:02:50,780 +sentier + +490 +00:02:50,780 --> 00:02:50,940 +qui a + +491 +00:02:50,940 --> 00:02:51,120 +été + +492 +00:02:51,120 --> 00:02:51,900 +établi, + +493 +00:02:51,900 --> 00:02:52,120 +soit + +494 +00:02:52,120 --> 00:02:52,720 +volontairement + +495 +00:02:52,720 --> 00:02:52,800 +en + +496 +00:02:52,800 --> 00:02:53,060 +marchant + +497 +00:02:53,060 --> 00:02:54,240 +dessus, + +498 +00:02:54,240 --> 00:02:54,920 +soit + +499 +00:02:54,920 --> 00:02:55,360 +en + +500 +00:02:55,360 --> 00:02:55,500 +définissant + +501 +00:02:55,500 --> 00:02:55,760 +des + +502 +00:02:55,760 --> 00:02:56,040 +bornes, + +503 +00:02:56,040 --> 00:02:56,080 +en + +504 +00:02:56,080 --> 00:02:56,580 +définissant + +505 +00:02:56,580 --> 00:02:56,820 +une + +506 +00:02:56,820 --> 00:02:57,420 +signalétique. + diff --git a/tests/expected/split_subtitles/smartphone.mp3_6.vtt b/tests/expected/split_subtitles/smartphone.mp3_6.vtt new file mode 100644 index 0000000000000000000000000000000000000000..61871c111372405e0b3331b5d11e0e1cbd3f450e --- /dev/null +++ b/tests/expected/split_subtitles/smartphone.mp3_6.vtt @@ -0,0 +1,1520 @@ +WEBVTT + +00:00.380 --> 00:00.580 +C'est + +00:00.580 --> 00:00.880 +évident + +00:00.880 --> 00:01.080 +ce que + +00:01.080 --> 00:01.200 +dit + +00:01.200 --> 00:01.780 +Nicolas, + +00:01.780 --> 00:01.900 +mais + +00:01.900 --> 00:02.340 +je ne + +00:02.340 --> 00:02.380 +me + +00:02.380 --> 00:02.580 +l'étais + +00:02.580 --> 00:02.840 +jamais + +00:02.840 --> 00:03.260 +formulé + +00:03.260 --> 00:03.420 +comme + +00:03.420 --> 00:03.620 +ça. 
+ +00:04.080 --> 00:04.340 +Ce qui + +00:04.340 --> 00:04.480 +fait + +00:04.480 --> 00:04.660 +la + +00:04.660 --> 00:05.000 +force + +00:05.000 --> 00:05.200 +du + +00:05.200 --> 00:05.880 +smartphone, + +00:05.880 --> 00:06.120 +c'est + +00:06.120 --> 00:06.260 +pas + +00:06.260 --> 00:06.520 +seulement + +00:06.520 --> 00:07.380 +l'accumulation + +00:07.380 --> 00:07.560 +des + +00:07.560 --> 00:07.920 +fonctions, + +00:08.320 --> 00:08.440 +mais + +00:08.440 --> 00:08.600 +la + +00:08.600 --> 00:08.900 +manière + +00:08.900 --> 00:09.100 +dont + +00:09.100 --> 00:09.480 +elles + +00:09.480 --> 00:10.320 +interagissent + +00:10.320 --> 00:10.580 +entre + +00:10.580 --> 00:10.880 +elles. + +00:10.960 --> 00:11.220 +Ce qui + +00:11.220 --> 00:11.400 +dit + +00:11.400 --> 00:11.560 +d'ailleurs + +00:11.560 --> 00:11.780 +sur la + +00:11.780 --> 00:12.120 +photo, + +00:12.120 --> 00:12.200 +c'est + +00:12.200 --> 00:12.420 +hyper + +00:12.420 --> 00:13.000 +convaincant. + +00:13.340 --> 00:13.620 +Alors + +00:13.620 --> 00:14.340 +évidemment, + +00:14.340 --> 00:14.380 +il + +00:14.380 --> 00:14.740 +faudrait + +00:14.740 --> 00:15.160 +ajouter + +00:15.160 --> 00:15.520 +les + +00:15.520 --> 00:16.020 +interfaces. + +00:16.220 --> 00:16.700 +L'écran + +00:16.700 --> 00:17.060 +tactile + +00:17.060 --> 00:17.880 +a été + +00:17.880 --> 00:18.280 +beaucoup + +00:18.280 --> 00:18.620 +très + +00:18.620 --> 00:18.900 +souvent + +00:18.900 --> 00:19.360 +mentionné. 
+ +00:19.840 --> 00:20.220 +Mais + +00:20.220 --> 00:20.520 +bon, + +00:20.520 --> 00:20.600 +il + +00:20.600 --> 00:20.700 +faut + +00:20.700 --> 00:20.840 +dire + +00:20.840 --> 00:20.960 +qu'il + +00:20.960 --> 00:21.260 +profite + +00:21.260 --> 00:21.680 +aussi + +00:21.680 --> 00:22.100 +de 20 + +00:22.100 --> 00:22.320 +ans + +00:22.320 --> 00:22.480 +pendant + +00:22.480 --> 00:22.920 +lesquels + +00:22.920 --> 00:23.040 +les + +00:23.040 --> 00:23.540 +ordinateurs + +00:23.540 --> 00:23.720 +nous + +00:23.720 --> 00:23.820 +ont + +00:23.820 --> 00:24.100 +appris + +00:24.100 --> 00:24.240 +à + +00:24.240 --> 00:24.500 +cliquer + +00:24.500 --> 00:24.660 +sur + +00:24.660 --> 00:24.940 +des + +00:24.940 --> 00:25.260 +icônes. + +00:25.420 --> 00:25.760 +Sauf + +00:25.760 --> 00:26.660 +que le + +00:26.660 --> 00:27.060 +smartphone + +00:27.060 --> 00:27.440 +ajoute + +00:27.440 --> 00:27.620 +le + +00:27.620 --> 00:28.180 +toucher, + +00:28.180 --> 00:28.280 +ce qui + +00:28.280 --> 00:28.480 +rend + +00:28.480 --> 00:28.680 +le + +00:28.680 --> 00:29.100 +contact + +00:29.100 --> 00:29.460 +plus + +00:29.460 --> 00:30.220 +direct, + +00:30.220 --> 00:30.260 +plus + +00:30.260 --> 00:30.640 +sensible. 
+ +00:31.040 --> 00:31.220 +Et + +00:31.220 --> 00:31.360 +puis + +00:31.360 --> 00:31.700 +évidemment, + +00:31.700 --> 00:31.740 +il + +00:31.740 --> 00:31.940 +faudrait + +00:31.940 --> 00:32.120 +parler + +00:32.120 --> 00:32.340 +aussi + +00:32.340 --> 00:32.480 +des + +00:32.480 --> 00:32.900 +applications + +00:32.900 --> 00:33.180 +qui + +00:33.180 --> 00:33.740 +permettent + +00:33.740 --> 00:33.960 +de + +00:33.960 --> 00:34.420 +contourner + +00:34.420 --> 00:34.520 +le + +00:34.520 --> 00:34.800 +côté + +00:34.800 --> 00:35.320 +touffu + +00:35.320 --> 00:35.780 +de la + +00:35.780 --> 00:36.240 +navigation + +00:36.240 --> 00:36.600 +web + +00:36.600 --> 00:36.780 +pour + +00:36.780 --> 00:36.980 +aller + +00:36.980 --> 00:37.520 +directement + +00:37.520 --> 00:37.680 +au + +00:37.680 --> 00:37.820 +but. + +00:37.820 --> 00:38.760 +Bref, + +00:38.760 --> 00:38.980 +tout + +00:38.980 --> 00:39.420 +ça, + +00:39.420 --> 00:39.880 +ce sont + +00:39.880 --> 00:40.160 +les + +00:40.160 --> 00:40.680 +conditions + +00:40.680 --> 00:40.960 +qui + +00:40.960 --> 00:41.460 +permettent + +00:41.460 --> 00:41.600 +de + +00:41.600 --> 00:42.060 +créer + +00:42.060 --> 00:42.380 +cet + +00:42.380 --> 00:42.600 +objet + +00:42.600 --> 00:42.800 +dont + +00:42.800 --> 00:43.260 +Nicolas + +00:43.260 --> 00:43.500 +dit + +00:43.500 --> 00:43.700 +qu'il + +00:43.700 --> 00:43.880 +est + +00:43.880 --> 00:44.980 +vraisemblablement + +00:44.980 --> 00:45.380 +inédit + +00:45.380 --> 00:45.700 +dans + +00:45.700 --> 00:45.980 +l'histoire + +00:45.980 --> 00:46.180 +de + +00:46.180 --> 00:46.580 +l'humanité. + +00:46.600 --> 00:47.240 +Mais + +00:47.240 --> 00:47.720 +ça, + +00:47.720 --> 00:47.840 +ça soulève + +00:47.840 --> 00:48.020 +une + +00:48.020 --> 00:48.260 +autre + +00:48.260 --> 00:48.820 +interrogation. 
+ +00:49.220 --> 00:49.620 +Est-ce + +00:49.620 --> 00:49.820 +que le + +00:49.820 --> 00:49.980 +fait + +00:49.980 --> 00:50.140 +que + +00:50.140 --> 00:50.320 +cet + +00:50.320 --> 00:50.660 +objet + +00:50.660 --> 00:51.120 +soit + +00:51.120 --> 00:51.800 +inédit + +00:51.800 --> 00:52.320 +induit + +00:52.320 --> 00:52.420 +que + +00:52.420 --> 00:52.720 +notre + +00:52.720 --> 00:53.280 +rapport + +00:53.280 --> 00:53.660 +à lui + +00:53.660 --> 00:54.020 +est + +00:54.020 --> 00:54.540 +aussi + +00:54.540 --> 00:54.700 +un + +00:54.700 --> 00:55.000 +rapport + +00:55.000 --> 00:55.460 +inédit? + +00:55.460 --> 00:55.900 +Je + +00:55.900 --> 00:56.000 +veux + +00:56.000 --> 00:56.240 +dire, + +00:56.240 --> 00:56.360 +est-ce + +00:56.360 --> 00:56.580 +que le + +00:56.580 --> 00:56.880 +rapport + +00:56.880 --> 00:57.040 +qu'on + +00:57.040 --> 00:57.280 +a au + +00:57.280 --> 00:57.600 +smartphone + +00:57.600 --> 00:57.920 +est + +00:57.920 --> 00:58.240 +comparable + +00:58.240 --> 00:58.480 +à + +00:58.480 --> 00:58.660 +celui + +00:58.660 --> 00:58.900 +qu'on + +00:58.900 --> 00:59.320 +entretenait + +00:59.320 --> 00:59.460 +à + +00:59.460 --> 00:59.700 +d'autres + +00:59.700 --> 00:59.960 +objets + +00:59.960 --> 01:00.460 +techniques + +01:00.460 --> 01:00.880 +comme + +01:00.880 --> 01:01.500 +la + +01:01.500 --> 01:02.060 +voiture + +01:02.060 --> 01:02.680 +ou le + +01:02.680 --> 01:03.120 +téléphone? + +01:03.360 --> 01:05.480 +Il n'y + +01:05.480 --> 01:05.660 +a pas + +01:05.660 --> 01:06.220 +d'équivalent + +01:06.220 --> 01:06.420 +en + +01:06.420 --> 01:06.660 +fait. 
+ +01:06.880 --> 01:06.980 +Et + +01:06.980 --> 01:07.080 +donc + +01:07.080 --> 01:07.280 +cette + +01:07.280 --> 01:07.540 +espèce + +01:07.540 --> 01:07.680 +de + +01:07.680 --> 01:08.480 +nouveauté + +01:08.480 --> 01:08.660 +dans + +01:08.660 --> 01:08.940 +la + +01:08.940 --> 01:09.220 +relation + +01:09.220 --> 01:09.380 +à + +01:09.380 --> 01:10.240 +l'objet, + +01:10.240 --> 01:10.380 +c'est + +01:10.380 --> 01:10.640 +fascinant + +01:10.640 --> 01:10.760 +et + +01:10.760 --> 01:11.520 +terrifiant. + +01:11.620 --> 01:11.860 +Parce + +01:11.860 --> 01:12.120 +qu'on + +01:12.120 --> 01:12.440 +a + +01:12.440 --> 01:13.560 +l'impression, + +01:13.560 --> 01:13.840 +comme + +01:13.840 --> 01:14.000 +le + +01:14.000 --> 01:14.200 +disent + +01:14.200 --> 01:14.400 +les + +01:14.400 --> 01:14.840 +utilisateurs + +01:14.840 --> 01:15.000 +et les + +01:15.000 --> 01:15.220 +services, + +01:15.220 --> 01:15.420 +d'être + +01:15.420 --> 01:15.960 +dépendants + +01:15.960 --> 01:16.260 +de cet + +01:16.260 --> 01:16.480 +objet, + +01:16.860 --> 01:17.080 +d'induire + +01:17.080 --> 01:17.240 +en + +01:17.240 --> 01:17.340 +fait + +01:17.340 --> 01:17.520 +une + +01:17.520 --> 01:17.880 +espèce + +01:17.880 --> 01:18.480 +de + +01:18.480 --> 01:18.600 +relation, + +01:18.600 --> 01:18.940 +de + +01:18.940 --> 01:19.520 +médiation + +01:19.520 --> 01:19.740 +avec + +01:19.740 --> 01:19.920 +le + +01:19.920 --> 01:20.640 +monde + +01:20.640 --> 01:21.100 +qui + +01:21.100 --> 01:21.640 +rend + +01:21.640 --> 01:21.780 +de + +01:21.780 --> 01:22.020 +l'ampleur + +01:22.020 --> 01:22.240 +et qui + +01:22.240 --> 01:22.360 +amène + +01:22.360 --> 01:22.560 +aussi + +01:22.560 --> 01:22.720 +à des + +01:22.720 --> 01:22.900 +formes + +01:22.900 --> 01:23.020 +de + +01:23.020 --> 01:23.260 +rejet. 
+ +01:23.940 --> 01:24.940 +Donc, + +01:24.940 --> 01:24.980 +à + +01:24.980 --> 01:25.360 +objet + +01:25.360 --> 01:26.560 +inédit, + +01:26.560 --> 01:27.000 +rapport + +01:27.000 --> 01:27.800 +inédit. + +01:28.020 --> 01:28.860 +Et ce + +01:28.860 --> 01:29.280 +rapport, + +01:29.280 --> 01:29.560 +si + +01:29.560 --> 01:29.840 +j'en + +01:29.840 --> 01:29.880 +crois + +01:29.880 --> 01:30.540 +Nicolas, + +01:30.540 --> 01:30.940 +serait + +01:30.940 --> 01:31.800 +caractérisé + +01:31.800 --> 01:32.440 +par un + +01:32.440 --> 01:32.980 +mélange + +01:32.980 --> 01:33.400 +de + +01:33.400 --> 01:34.240 +dépendance + +01:34.240 --> 01:34.680 +et de + +01:34.680 --> 01:35.140 +rejet. + +01:35.780 --> 01:36.380 +Bon, + +01:36.380 --> 01:36.520 +en + +01:36.520 --> 01:37.140 +vrai, + +01:37.140 --> 01:37.180 +il + +01:37.180 --> 01:37.580 +faudrait + +01:37.580 --> 01:38.080 +remonter + +01:38.080 --> 01:38.580 +très + +01:38.580 --> 01:38.700 +très + +01:38.700 --> 01:39.320 +finement + +01:39.320 --> 01:39.700 +toute + +01:39.700 --> 01:40.060 +l'histoire + +01:40.060 --> 01:40.240 +des + +01:40.240 --> 01:40.480 +objets + +01:40.480 --> 01:41.020 +techniques + +01:41.020 --> 01:41.680 +et de + +01:41.680 --> 01:41.840 +leur + +01:41.840 --> 01:42.320 +insertion + +01:42.320 --> 01:42.480 +dans + +01:42.480 --> 01:42.660 +nos + +01:42.660 --> 01:42.860 +vies + +01:42.900 --> 01:43.060 +pour + +01:43.060 --> 01:43.660 +déterminer + +01:43.660 --> 01:43.940 +si ce + +01:43.940 --> 01:44.260 +rapport + +01:44.260 --> 01:44.740 +est + +01:44.740 --> 01:45.300 +totalement + +01:45.300 --> 01:45.740 +inédit. + +01:46.100 --> 01:46.360 +Mais + +01:46.360 --> 01:46.920 +j'ai + +01:46.920 --> 01:47.360 +l'impression + +01:47.360 --> 01:47.560 +comme + +01:47.560 --> 01:47.960 +ça que + +01:47.960 --> 01:48.460 +Nicolas + +01:48.460 --> 01:48.700 +ne se + +01:48.700 --> 01:48.880 +trompe + +01:48.880 --> 01:49.080 +pas + +01:49.080 --> 01:49.340 +vraiment. 
+ +01:49.880 --> 01:50.080 +Pour + +01:50.080 --> 01:50.240 +autant + +01:50.240 --> 01:50.520 +que je + +01:50.520 --> 01:51.140 +sache, + +01:51.140 --> 01:51.360 +il y a + +01:51.360 --> 01:51.680 +eu + +01:51.680 --> 01:51.880 +plein + +01:51.880 --> 01:52.060 +de + +01:52.060 --> 01:52.600 +discussions + +01:52.600 --> 01:52.940 +autour + +01:52.940 --> 01:53.520 +de la + +01:53.520 --> 01:53.860 +voiture + +01:53.860 --> 01:54.060 +ou + +01:54.060 --> 01:54.440 +même + +01:54.440 --> 01:54.600 +du + +01:54.600 --> 01:54.980 +téléphone. + +01:55.340 --> 01:55.720 +Mais + +01:55.720 --> 01:56.020 +la + +01:56.020 --> 01:56.400 +dépendance + +01:56.400 --> 01:56.620 +n'était + +01:56.620 --> 01:57.160 +pas du + +01:57.160 --> 01:57.460 +même + +01:57.460 --> 01:57.780 +ordre. + +01:57.780 --> 01:57.980 +Donc + +01:57.980 --> 01:58.340 +le + +01:58.340 --> 01:58.620 +rejet + +01:58.620 --> 01:58.780 +non + +01:58.780 --> 01:58.940 +plus + +01:58.940 --> 01:59.120 +n'était + +01:59.120 --> 01:59.380 +pas du + +01:59.380 --> 01:59.560 +même + +01:59.560 --> 01:59.840 +ordre. + +01:59.980 --> 02:00.180 +On + +02:00.180 --> 02:00.380 +peut + +02:00.380 --> 02:00.660 +adorer + +02:00.660 --> 02:00.880 +sa + +02:00.880 --> 02:01.460 +bagnole, + +02:01.460 --> 02:01.560 +en + +02:01.560 --> 02:01.740 +avoir + +02:01.740 --> 02:02.100 +besoin + +02:02.100 --> 02:02.340 +pour + +02:02.340 --> 02:02.680 +plein + +02:02.680 --> 02:02.800 +de + +02:02.800 --> 02:03.020 +choses. + +02:03.280 --> 02:03.460 +Et + +02:03.460 --> 02:03.860 +bien, + +02:03.860 --> 02:03.980 +le + +02:03.980 --> 02:04.680 +soir, + +02:04.680 --> 02:04.900 +quand + +02:04.900 --> 02:05.140 +on va + +02:05.140 --> 02:05.380 +se + +02:05.380 --> 02:05.800 +coucher, + +02:05.800 --> 02:06.220 +on la + +02:06.220 --> 02:06.360 +laisse. 
+ +02:06.980 --> 02:07.360 +On ne + +02:07.360 --> 02:07.480 +l'a + +02:07.480 --> 02:07.680 +pas + +02:07.680 --> 02:07.800 +dans + +02:07.800 --> 02:08.060 +la + +02:08.060 --> 02:08.260 +main + +02:08.260 --> 02:08.440 +quand + +02:08.440 --> 02:08.680 +on est + +02:08.680 --> 02:09.040 +au + +02:09.040 --> 02:09.140 +lit, + +02:09.140 --> 02:09.300 +on ne + +02:09.300 --> 02:09.500 +l'emmène + +02:09.500 --> 02:09.860 +pas au + +02:09.860 --> 02:10.480 +chiottes. + +02:10.860 --> 02:11.040 +On + +02:11.040 --> 02:11.280 +pouvait + +02:11.280 --> 02:11.480 +être + +02:11.480 --> 02:12.220 +énervé + +02:12.220 --> 02:12.440 +par + +02:12.440 --> 02:12.700 +son + +02:12.700 --> 02:13.100 +môme + +02:13.100 --> 02:13.340 +qui + +02:13.340 --> 02:13.760 +occupait + +02:13.760 --> 02:13.800 +la + +02:13.800 --> 02:14.080 +ligne + +02:14.080 --> 02:14.140 +de + +02:14.140 --> 02:14.600 +téléphone + +02:14.600 --> 02:14.820 +pendant + +02:14.820 --> 02:15.200 +une + +02:15.200 --> 02:15.360 +heure + +02:15.360 --> 02:15.540 +chaque + +02:15.540 --> 02:15.800 +soir + +02:15.800 --> 02:15.960 +pour + +02:15.960 --> 02:16.280 +discuter + +02:16.280 --> 02:16.480 +avec + +02:16.480 --> 02:16.600 +un + +02:16.600 --> 02:16.900 +copain. 
+ +02:17.280 --> 02:17.460 +Mais + +02:17.460 --> 02:17.940 +ça ne + +02:17.940 --> 02:18.400 +ressemblait + +02:18.400 --> 02:18.940 +pas à + +02:18.940 --> 02:18.980 +ce + +02:18.980 --> 02:19.100 +qu'on + +02:19.100 --> 02:19.480 +peut + +02:19.480 --> 02:20.120 +ressentir + +02:20.120 --> 02:20.460 +à voir + +02:20.460 --> 02:20.680 +ce + +02:20.680 --> 02:20.920 +même + +02:20.920 --> 02:21.340 +môme + +02:21.340 --> 02:21.880 +aujourd'hui, + +02:22.140 --> 02:22.940 +continuellement + +02:22.940 --> 02:23.180 +avec + +02:23.180 --> 02:23.380 +son + +02:23.380 --> 02:23.760 +smartphone + +02:23.760 --> 02:23.940 +dans + +02:23.940 --> 02:24.000 +la + +02:24.000 --> 02:24.360 +main, + +02:24.360 --> 02:24.520 +comme + +02:24.520 --> 02:24.640 +si + +02:24.640 --> 02:24.820 +c'était + +02:24.820 --> 02:25.060 +une + +02:25.060 --> 02:25.220 +sorte + +02:25.220 --> 02:25.300 +de + +02:25.300 --> 02:25.820 +pacemaker + +02:25.820 --> 02:26.300 +externe, + +02:26.340 --> 02:26.580 +comme + +02:26.580 --> 02:26.860 +si le + +02:26.860 --> 02:27.360 +lâcher + +02:27.360 --> 02:27.560 +allait + +02:27.560 --> 02:27.860 +entraîner + +02:27.860 --> 02:28.000 +sa + +02:28.000 --> 02:28.220 +mort + +02:28.220 --> 02:28.840 +immédiate. + +02:29.040 --> 02:29.280 +Bon, + +02:29.280 --> 02:29.460 +je dis + +02:29.460 --> 02:29.640 +ça + +02:29.640 --> 02:29.740 +pour + +02:29.740 --> 02:29.880 +le + +02:29.880 --> 02:30.320 +môme, + +02:30.320 --> 02:30.520 +mais + +02:30.520 --> 02:30.820 +c'est + +02:30.820 --> 02:31.140 +évidemment + +02:31.140 --> 02:31.480 +valable + +02:31.480 --> 02:31.620 +pour + +02:31.620 --> 02:31.760 +nous + +02:31.760 --> 02:31.960 +aussi. + +02:32.340 --> 02:33.460 +Donc, + +02:33.460 --> 02:33.660 +rapport + +02:33.660 --> 02:34.240 +inédit. + +02:34.240 --> 02:35.480 +D'accord. 
+ +02:35.480 --> 02:35.820 +Mais + +02:35.820 --> 02:36.320 +pourquoi + +02:36.320 --> 02:36.680 +a-t-on + +02:36.680 --> 02:37.060 +l'impression + +02:37.060 --> 02:37.260 +qu'on + +02:37.260 --> 02:37.440 +n'en + +02:37.440 --> 02:37.900 +sortira + +02:37.900 --> 02:38.220 +jamais? + +02:38.860 --> 02:39.340 +Est-ce + +02:39.340 --> 02:39.460 +qu'il + +02:39.460 --> 02:39.620 +faut + +02:39.620 --> 02:39.780 +en + +02:39.780 --> 02:40.120 +remettre + +02:40.120 --> 02:40.340 +la + +02:40.340 --> 02:40.660 +faute + +02:40.660 --> 02:40.940 +sur + +02:40.940 --> 02:41.280 +les + +02:41.280 --> 02:41.440 +gens + +02:41.440 --> 02:41.580 +qui + +02:41.580 --> 02:41.720 +ont + +02:41.720 --> 02:42.300 +créé + +02:42.300 --> 02:42.460 +cet + +02:42.460 --> 02:42.780 +outil + +02:42.780 --> 02:43.340 +merveilleux + +02:43.340 --> 02:43.500 +et + +02:43.500 --> 02:43.860 +diabolique, + +02:43.860 --> 02:43.920 +et + +02:43.920 --> 02:44.400 +diabolique + +02:44.400 --> 02:44.660 +parce + +02:44.660 --> 02:44.840 +que + +02:44.840 --> 02:45.320 +merveilleux? + +02:46.340 --> 02:47.040 +Les + +02:47.040 --> 02:47.480 +économistes + +02:47.480 --> 02:47.680 +parlent + +02:47.680 --> 02:47.820 +de + +02:47.820 --> 02:48.360 +dépendance + +02:48.360 --> 02:48.500 +du + +02:48.500 --> 02:48.820 +sentier. 
+ +02:48.860 --> 02:49.100 +C'est + +02:49.100 --> 02:49.340 +l'idée + +02:49.340 --> 02:49.700 +qu'on + +02:49.700 --> 02:49.880 +est + +02:49.880 --> 02:50.540 +sur un + +02:50.540 --> 02:50.780 +sentier + +02:50.780 --> 02:50.940 +qui a + +02:50.940 --> 02:51.120 +été + +02:51.120 --> 02:51.900 +établi, + +02:51.900 --> 02:52.120 +soit + +02:52.120 --> 02:52.720 +volontairement + +02:52.720 --> 02:52.800 +en + +02:52.800 --> 02:53.060 +marchant + +02:53.060 --> 02:54.240 +dessus, + +02:54.240 --> 02:54.920 +soit + +02:54.920 --> 02:55.360 +en + +02:55.360 --> 02:55.500 +définissant + +02:55.500 --> 02:55.760 +des + +02:55.760 --> 02:56.040 +bornes, + +02:56.040 --> 02:56.080 +en + +02:56.080 --> 02:56.580 +définissant + +02:56.580 --> 02:56.820 +une + +02:56.820 --> 02:57.420 +signalétique. + diff --git a/tests/expected/tiny.en.cpu/nocond_bonjour_vous_allez_bien.mp3.words.json b/tests/expected/tiny.en.cpu/nocond_bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..be3e848ef767849ee49d451215e9eb018ec0f049 --- /dev/null +++ b/tests/expected/tiny.en.cpu/nocond_bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,204 @@ +{ + "text": " Mohoo! Let's go with it again! Mohoo! Mohoo! Mohoo! Let's go with it again!", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.44, + "end": 2.98, + "text": " Mohoo! 
Let's go with it again!", + "tokens": [ + 50363, + 337, + 1219, + 2238, + 0, + 3914, + 338, + 467, + 351, + 340, + 757, + 0, + 50513 + ], + "temperature": 0.0, + "avg_logprob": -0.8020243644714355, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.11818066984415054, + "confidence": 0.496, + "words": [ + { + "text": "Mohoo!", + "start": 0.44, + "end": 1.72, + "confidence": 0.271 + }, + { + "text": "Let's", + "start": 1.72, + "end": 2.04, + "confidence": 0.678 + }, + { + "text": "go", + "start": 2.04, + "end": 2.18, + "confidence": 0.914 + }, + { + "text": "with", + "start": 2.18, + "end": 2.38, + "confidence": 0.234 + }, + { + "text": "it", + "start": 2.38, + "end": 2.44, + "confidence": 0.933 + }, + { + "text": "again!", + "start": 2.44, + "end": 2.98, + "confidence": 0.996 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 30.06, + "end": 31.25, + "text": " Mohoo!", + "tokens": [ + 337, + 1219, + 2238, + 0 + ], + "temperature": 0.0, + "avg_logprob": -0.8320662379264832, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.15341022610664368, + "confidence": 0.308, + "words": [ + { + "text": "Mohoo!", + "start": 30.06, + "end": 31.25, + "confidence": 0.308 + } + ] + }, + { + "id": 2, + "seek": 3100, + "start": 31.25, + "end": 32.48, + "text": " Mohoo!", + "tokens": [ + 337, + 1219, + 2238, + 0 + ], + "temperature": 0.0, + "avg_logprob": -0.767271101474762, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.1705959141254425, + "confidence": 0.329, + "words": [ + { + "text": "Mohoo!", + "start": 31.25, + "end": 32.48, + "confidence": 0.329 + } + ] + }, + { + "id": 3, + "seek": 3200, + "start": 32.98, + "end": 33.8, + "text": " Mohoo!", + "tokens": [ + 337, + 1219, + 2238, + 0 + ], + "temperature": 0.0, + "avg_logprob": -0.5514491200447083, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.1296440064907074, + "confidence": 0.338, + "words": [ + { + "text": "Mohoo!", + "start": 32.98, + "end": 33.8, + 
"confidence": 0.338 + } + ] + }, + { + "id": 4, + "seek": 3400, + "start": 34.4, + "end": 35.48, + "text": " Let's go with it again!", + "tokens": [ + 50363, + 3914, + 338, + 467, + 351, + 340, + 757, + 0, + 50463 + ], + "temperature": 0.0, + "avg_logprob": -0.3764993667602539, + "compression_ratio": 0.7419354838709677, + "no_speech_prob": 0.05320969223976135, + "confidence": 0.815, + "words": [ + { + "text": "Let's", + "start": 34.4, + "end": 34.58, + "confidence": 0.862 + }, + { + "text": "go", + "start": 34.58, + "end": 34.76, + "confidence": 0.923 + }, + { + "text": "with", + "start": 34.76, + "end": 34.96, + "confidence": 0.627 + }, + { + "text": "it", + "start": 34.96, + "end": 35.0, + "confidence": 0.686 + }, + { + "text": "again!", + "start": 35.0, + "end": 35.48, + "confidence": 0.992 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/tiny.en/accurate_bonjour_vous_allez_bien.mp3.words.json b/tests/expected/tiny.en/accurate_bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..2e3ab6c3b9044538fc203c07d609c9cd0936f351 --- /dev/null +++ b/tests/expected/tiny.en/accurate_bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,134 @@ +{ + "text": " Mohoo, let's go with it again Mohoo, let's go with it again", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 2.84, + "text": " Mohoo, let's go with it again", + "tokens": [ + 50363, + 337, + 1219, + 2238, + 11, + 1309, + 338, + 467, + 351, + 340, + 757, + 50501 + ], + "temperature": 0.0, + "avg_logprob": -0.7695202460655799, + "compression_ratio": 0.7837837837837838, + "no_speech_prob": 0.11803863942623138, + "confidence": 0.485, + "words": [ + { + "text": "Mohoo,", + "start": 0.42, + "end": 1.38, + "confidence": 0.245 + }, + { + "text": "let's", + "start": 1.92, + "end": 2.2, + "confidence": 0.91 + }, + { + "text": "go", + "start": 2.2, + "end": 2.3, + "confidence": 0.908 + }, + { + "text": "with", + 
"start": 2.3, + "end": 2.46, + "confidence": 0.286 + }, + { + "text": "it", + "start": 2.46, + "end": 2.56, + "confidence": 0.939 + }, + { + "text": "again", + "start": 2.56, + "end": 2.84, + "confidence": 0.997 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 32.86, + "end": 35.42, + "text": " Mohoo, let's go with it again", + "tokens": [ + 50363, + 337, + 1219, + 2238, + 11, + 1309, + 338, + 467, + 351, + 340, + 757, + 50627 + ], + "temperature": 0.0, + "avg_logprob": -0.4126271101144644, + "compression_ratio": 0.7837837837837838, + "no_speech_prob": 0.34721481800079346, + "confidence": 0.544, + "words": [ + { + "text": "Mohoo,", + "start": 32.86, + "end": 34.02, + "confidence": 0.277 + }, + { + "text": "let's", + "start": 34.46, + "end": 34.74, + "confidence": 0.89 + }, + { + "text": "go", + "start": 34.74, + "end": 34.86, + "confidence": 0.935 + }, + { + "text": "with", + "start": 34.86, + "end": 34.98, + "confidence": 0.658 + }, + { + "text": "it", + "start": 34.98, + "end": 35.1, + "confidence": 0.79 + }, + { + "text": "again", + "start": 35.1, + "end": 35.42, + "confidence": 0.997 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/tiny.en/efficient_bonjour_vous_allez_bien.mp3.words.json b/tests/expected/tiny.en/efficient_bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..fd22690c94ca48ebf75bd0ad7159776ca30f8161 --- /dev/null +++ b/tests/expected/tiny.en/efficient_bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,136 @@ +{ + "text": " Mohoo! Let's go with it again! Mohoo! Let's go with it again!", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 2.8, + "text": " Mohoo! 
Let's go with it again!", + "tokens": [ + 50363, + 337, + 1219, + 2238, + 0, + 3914, + 338, + 467, + 351, + 340, + 757, + 0, + 50513 + ], + "temperature": 0.0, + "avg_logprob": -0.8020311764308384, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.11798259615898132, + "confidence": 0.496, + "words": [ + { + "text": "Mohoo!", + "start": 0.42, + "end": 1.36, + "confidence": 0.271 + }, + { + "text": "Let's", + "start": 1.9, + "end": 2.18, + "confidence": 0.677 + }, + { + "text": "go", + "start": 2.18, + "end": 2.32, + "confidence": 0.914 + }, + { + "text": "with", + "start": 2.32, + "end": 2.46, + "confidence": 0.233 + }, + { + "text": "it", + "start": 2.46, + "end": 2.56, + "confidence": 0.933 + }, + { + "text": "again!", + "start": 2.56, + "end": 2.8, + "confidence": 0.996 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 32.98, + "end": 35.44, + "text": " Mohoo! Let's go with it again!", + "tokens": [ + 50363, + 337, + 1219, + 2238, + 0, + 3914, + 338, + 467, + 351, + 340, + 757, + 0, + 50663 + ], + "temperature": 0.0, + "avg_logprob": -0.1937453576496669, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.45197251439094543, + "confidence": 0.952, + "words": [ + { + "text": "Mohoo!", + "start": 32.98, + "end": 34.02, + "confidence": 0.896 + }, + { + "text": "Let's", + "start": 34.44, + "end": 34.72, + "confidence": 0.96 + }, + { + "text": "go", + "start": 34.72, + "end": 34.84, + "confidence": 0.99 + }, + { + "text": "with", + "start": 34.84, + "end": 35.0, + "confidence": 0.985 + }, + { + "text": "it", + "start": 35.0, + "end": 35.1, + "confidence": 0.991 + }, + { + "text": "again!", + "start": 35.1, + "end": 35.44, + "confidence": 0.998 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/tiny.en/nocond_bonjour_vous_allez_bien.mp3.words.json b/tests/expected/tiny.en/nocond_bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..7e5c247abd49416c05ae5573819ef3e295747932 --- /dev/null +++ b/tests/expected/tiny.en/nocond_bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,154 @@ +{ + "text": " Mohoo! Let's go with it again! Mohoo! Let's go with it again!", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 2.8, + "text": " Mohoo! Let's go with it again!", + "tokens": [ + 50363, + 337, + 1219, + 2238, + 0, + 3914, + 338, + 467, + 351, + 340, + 757, + 0, + 50513 + ], + "temperature": 0.0, + "avg_logprob": -0.8020311764308384, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.11798259615898132, + "confidence": 0.496, + "words": [ + { + "text": "Mohoo!", + "start": 0.42, + "end": 1.36, + "confidence": 0.271 + }, + { + "text": "Let's", + "start": 1.9, + "end": 2.18, + "confidence": 0.677 + }, + { + "text": "go", + "start": 2.18, + "end": 2.32, + "confidence": 0.914 + }, + { + "text": "with", + "start": 2.32, + "end": 2.46, + "confidence": 0.233 + }, + { + "text": "it", + "start": 2.46, + "end": 2.56, + "confidence": 0.933 + }, + { + "text": "again!", + "start": 2.56, + "end": 2.8, + "confidence": 0.996 + } + ] + }, + { + "id": 1, + "seek": 3000, + "start": 30.0, + "end": 30.06, + "text": " Mohoo!", + "tokens": [ + 50363, + 337, + 1219, + 2238, + 0, + 50413 + ], + "temperature": 0.0, + "avg_logprob": -0.8368260264396667, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.13588112592697144, + "confidence": 0.306, + "words": [ + { + "text": "Mohoo!", + "start": 30.0, + "end": 30.06, + "confidence": 0.306 + } + ] + }, + { + "id": 2, + "seek": 3000, + "start": 34.38, + "end": 35.36, + "text": " Let's go with it again!", + "tokens": [ + 50413, + 3914, + 338, + 467, + 351, + 340, + 757, + 0, + 50613 + ], + "temperature": 0.0, + "avg_logprob": -0.8368260264396667, + "compression_ratio": 0.7894736842105263, + "no_speech_prob": 0.13588112592697144, + "confidence": 0.847, + "words": [ + { + "text": "Let's", + "start": 
34.38, + "end": 34.74, + "confidence": 0.876 + }, + { + "text": "go", + "start": 34.74, + "end": 34.86, + "confidence": 0.96 + }, + { + "text": "with", + "start": 34.86, + "end": 34.98, + "confidence": 0.619 + }, + { + "text": "it", + "start": 34.98, + "end": 35.1, + "confidence": 0.811 + }, + { + "text": "again!", + "start": 35.1, + "end": 35.36, + "confidence": 0.997 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/tiny_auto.cpu/gaenswein15.mp3.words.json b/tests/expected/tiny_auto.cpu/gaenswein15.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..2fa1b2d83ea55923062a1564d4750ee40a08e1b9 --- /dev/null +++ b/tests/expected/tiny_auto.cpu/gaenswein15.mp3.words.json @@ -0,0 +1,318 @@ +{ + "text": " Wie wieder zu dazu ist Meshfuchs von 1962 als Meshale für die außerordentliche Form des grullischen Rätos ist dann nicht so weitergegangen wie sich Papsbelle dick das gewünscht hatte. Das hat er als Meshale im Rätos.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.9, + "end": 12.76, + "text": " Wie wieder zu dazu ist Meshfuchs von 1962 als Meshale für die außerordentliche Form des grullischen Rätos ist dann nicht so weitergegangen wie sich Papsbelle dick das gewünscht hatte.", + "tokens": [ + 9233, + 6216, + 2164, + 13034, + 1418, + 376, + 14935, + 69, + 37503, + 2957, + 39498, + 3907, + 376, + 14935, + 1220, + 2959, + 978, + 39428, + 765, + 7698, + 68, + 10126, + 730, + 677, + 858, + 6282, + 497, + 3628, + 329, + 1418, + 3594, + 1979, + 370, + 8988, + 432, + 47152, + 3355, + 3041, + 430, + 2382, + 65, + 4434, + 18659, + 1482, + 6906, + 3412, + 82, + 4701, + 13299, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.6555103008563702, + "compression_ratio": 1.2619047619047619, + "no_speech_prob": 0.11051499098539352, + "confidence": 0.541, + "words": [ + { + "text": "Wie", + "start": 0.9, + "end": 1.06, + "confidence": 0.478 + }, + { + "text": "wieder", + "start": 1.06, + "end": 1.32, 
+ "confidence": 0.901 + }, + { + "text": "zu", + "start": 1.32, + "end": 1.54, + "confidence": 0.249 + }, + { + "text": "dazu", + "start": 1.54, + "end": 1.86, + "confidence": 0.131 + }, + { + "text": "ist", + "start": 1.86, + "end": 2.12, + "confidence": 0.586 + }, + { + "text": "Meshfuchs", + "start": 2.12, + "end": 2.72, + "confidence": 0.332 + }, + { + "text": "von", + "start": 2.72, + "end": 2.94, + "confidence": 0.626 + }, + { + "text": "1962", + "start": 2.94, + "end": 4.72, + "confidence": 0.208 + }, + { + "text": "als", + "start": 4.72, + "end": 5.22, + "confidence": 0.885 + }, + { + "text": "Meshale", + "start": 5.22, + "end": 5.7, + "confidence": 0.385 + }, + { + "text": "für", + "start": 5.7, + "end": 5.9, + "confidence": 0.933 + }, + { + "text": "die", + "start": 5.9, + "end": 6.08, + "confidence": 0.972 + }, + { + "text": "außerordentliche", + "start": 6.08, + "end": 6.98, + "confidence": 0.899 + }, + { + "text": "Form", + "start": 6.98, + "end": 7.22, + "confidence": 0.655 + }, + { + "text": "des", + "start": 7.22, + "end": 7.58, + "confidence": 0.971 + }, + { + "text": "grullischen", + "start": 7.58, + "end": 8.04, + "confidence": 0.384 + }, + { + "text": "Rätos", + "start": 8.04, + "end": 8.58, + "confidence": 0.368 + }, + { + "text": "ist", + "start": 8.58, + "end": 9.6, + "confidence": 0.549 + }, + { + "text": "dann", + "start": 9.6, + "end": 9.74, + "confidence": 0.5 + }, + { + "text": "nicht", + "start": 9.74, + "end": 9.92, + "confidence": 0.936 + }, + { + "text": "so", + "start": 9.92, + "end": 10.08, + "confidence": 0.953 + }, + { + "text": "weitergegangen", + "start": 10.08, + "end": 10.86, + "confidence": 0.74 + }, + { + "text": "wie", + "start": 10.86, + "end": 11.04, + "confidence": 0.703 + }, + { + "text": "sich", + "start": 11.04, + "end": 11.22, + "confidence": 0.939 + }, + { + "text": "Papsbelle", + "start": 11.22, + "end": 11.62, + "confidence": 0.356 + }, + { + "text": "dick", + "start": 11.62, + "end": 11.84, + "confidence": 0.319 
+ }, + { + "text": "das", + "start": 11.84, + "end": 12.08, + "confidence": 0.844 + }, + { + "text": "gewünscht", + "start": 12.08, + "end": 12.48, + "confidence": 0.818 + }, + { + "text": "hatte.", + "start": 12.48, + "end": 12.76, + "confidence": 0.922 + } + ] + }, + { + "id": 1, + "seek": 1300, + "start": 13.98, + "end": 15.22, + "text": " Das hat er als Meshale im Rätos.", + "tokens": [ + 50364, + 2846, + 2385, + 1189, + 3907, + 376, + 14935, + 1220, + 566, + 497, + 3628, + 329, + 13, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.9505692799886067, + "compression_ratio": 0.8048780487804879, + "no_speech_prob": 0.044665463268756866, + "confidence": 0.381, + "words": [ + { + "text": "Das", + "start": 13.98, + "end": 14.2, + "confidence": 0.841 + }, + { + "text": "hat", + "start": 14.2, + "end": 14.32, + "confidence": 0.878 + }, + { + "text": "er", + "start": 14.32, + "end": 14.46, + "confidence": 0.606 + }, + { + "text": "als", + "start": 14.46, + "end": 14.7, + "confidence": 0.626 + }, + { + "text": "Meshale", + "start": 14.7, + "end": 15.0, + "confidence": 0.206 + }, + { + "text": "im", + "start": 15.0, + "end": 15.04, + "confidence": 0.101 + }, + { + "text": "Rätos.", + "start": 15.04, + "end": 15.22, + "confidence": 0.464 + } + ] + } + ], + "language": "de" +} \ No newline at end of file diff --git a/tests/expected/tiny_auto.cpu/radio_short.mp3.words.json b/tests/expected/tiny_auto.cpu/radio_short.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..f2388cb2c74572247a52a55a46815f03a82a84a0 --- /dev/null +++ b/tests/expected/tiny_auto.cpu/radio_short.mp3.words.json @@ -0,0 +1,3786 @@ +{ + "text": " What are you telling me, guys? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, guys? What are you telling me, guys? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? 
What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? 
What are you telling me, dude?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.06, + "end": 5.92, + "text": " What are you telling me, guys?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 1074, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.343, + "words": [ + { + "text": "What", + "start": 0.06, + "end": 4.9, + "confidence": 0.041 + }, + { + "text": "are", + "start": 4.9, + "end": 5.18, + "confidence": 0.603 + }, + { + "text": "you", + "start": 5.18, + "end": 5.42, + "confidence": 0.97 + }, + { + "text": "telling", + "start": 5.42, + "end": 5.64, + "confidence": 0.354 + }, + { + "text": "me,", + "start": 5.64, + "end": 5.88, + "confidence": 0.622 + }, + { + "text": "guys?", + "start": 5.88, + "end": 5.92, + "confidence": 0.307 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 6.5, + "end": 7.5, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.677, + "words": [ + { + "text": "What", + "start": 6.5, + "end": 6.92, + "confidence": 0.885 + }, + { + "text": "are", + "start": 6.92, + "end": 6.96, + "confidence": 0.936 + }, + { + "text": "you", + "start": 6.96, + "end": 7.02, + "confidence": 0.993 + }, + { + "text": "telling", + "start": 7.02, + "end": 7.24, + "confidence": 0.904 + }, + { + "text": "me,", + "start": 7.24, + "end": 7.46, + "confidence": 0.984 + }, + { + "text": "dude?", + "start": 7.46, + "end": 7.5, + "confidence": 0.131 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 7.52, + "end": 8.28, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + 
"compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.827, + "words": [ + { + "text": "What", + "start": 7.52, + "end": 7.56, + "confidence": 0.545 + }, + { + "text": "are", + "start": 7.56, + "end": 7.6, + "confidence": 0.851 + }, + { + "text": "you", + "start": 7.6, + "end": 7.64, + "confidence": 0.994 + }, + { + "text": "telling", + "start": 7.64, + "end": 7.68, + "confidence": 0.849 + }, + { + "text": "me,", + "start": 7.68, + "end": 8.16, + "confidence": 0.951 + }, + { + "text": "dude?", + "start": 8.16, + "end": 8.28, + "confidence": 0.857 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 10.46, + "end": 12.48, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.774, + "words": [ + { + "text": "What", + "start": 10.46, + "end": 10.54, + "confidence": 0.422 + }, + { + "text": "are", + "start": 10.54, + "end": 10.6, + "confidence": 0.79 + }, + { + "text": "you", + "start": 10.6, + "end": 11.38, + "confidence": 0.994 + }, + { + "text": "telling", + "start": 11.38, + "end": 11.66, + "confidence": 0.809 + }, + { + "text": "me,", + "start": 11.66, + "end": 12.44, + "confidence": 0.956 + }, + { + "text": "dude?", + "start": 12.44, + "end": 12.48, + "confidence": 0.837 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 12.48, + "end": 14.46, + "text": " What are you telling me, guys?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 1074, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.762, + "words": [ + { + "text": "What", + "start": 12.48, + "end": 12.52, + "confidence": 0.504 + }, + { + "text": "are", + "start": 12.52, + "end": 12.56, + "confidence": 0.845 + }, + { 
+ "text": "you", + "start": 12.56, + "end": 12.6, + "confidence": 0.994 + }, + { + "text": "telling", + "start": 12.6, + "end": 12.64, + "confidence": 0.844 + }, + { + "text": "me,", + "start": 12.64, + "end": 13.18, + "confidence": 0.962 + }, + { + "text": "guys?", + "start": 13.18, + "end": 14.46, + "confidence": 0.57 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 16.5, + "end": 21.3, + "text": " What are you telling me, guys?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 1074, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.936, + "words": [ + { + "text": "What", + "start": 16.5, + "end": 20.42, + "confidence": 0.887 + }, + { + "text": "are", + "start": 20.42, + "end": 20.54, + "confidence": 0.936 + }, + { + "text": "you", + "start": 20.54, + "end": 20.7, + "confidence": 0.996 + }, + { + "text": "telling", + "start": 20.7, + "end": 20.94, + "confidence": 0.934 + }, + { + "text": "me,", + "start": 20.94, + "end": 21.26, + "confidence": 0.897 + }, + { + "text": "guys?", + "start": 21.26, + "end": 21.3, + "confidence": 0.969 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 21.5, + "end": 22.78, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.953, + "words": [ + { + "text": "What", + "start": 21.5, + "end": 22.2, + "confidence": 0.951 + }, + { + "text": "are", + "start": 22.2, + "end": 22.24, + "confidence": 0.966 + }, + { + "text": "you", + "start": 22.24, + "end": 22.36, + "confidence": 0.997 + }, + { + "text": "telling", + "start": 22.36, + "end": 22.5, + "confidence": 0.862 + }, + { + "text": "me,", + "start": 22.5, + "end": 22.7, + "confidence": 0.984 + }, + { + "text": "dude?", + "start": 
22.7, + "end": 22.78, + "confidence": 0.967 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 22.78, + "end": 23.02, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.4002814409209461, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.856, + "words": [ + { + "text": "What", + "start": 22.78, + "end": 22.82, + "confidence": 0.54 + }, + { + "text": "are", + "start": 22.82, + "end": 22.86, + "confidence": 0.888 + }, + { + "text": "you", + "start": 22.86, + "end": 22.9, + "confidence": 0.996 + }, + { + "text": "telling", + "start": 22.9, + "end": 22.94, + "confidence": 0.882 + }, + { + "text": "me,", + "start": 22.94, + "end": 22.98, + "confidence": 0.975 + }, + { + "text": "dude?", + "start": 22.98, + "end": 23.02, + "confidence": 0.955 + } + ] + }, + { + "id": 8, + "seek": 2600, + "start": 26.02, + "end": 28.74, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.523, + "words": [ + { + "text": "What", + "start": 26.02, + "end": 26.06, + "confidence": 0.145 + }, + { + "text": "are", + "start": 26.06, + "end": 27.16, + "confidence": 0.442 + }, + { + "text": "you", + "start": 27.16, + "end": 28.24, + "confidence": 0.944 + }, + { + "text": "telling", + "start": 28.24, + "end": 28.28, + "confidence": 0.536 + }, + { + "text": "me,", + "start": 28.28, + "end": 28.7, + "confidence": 0.926 + }, + { + "text": "dude?", + "start": 28.7, + "end": 28.74, + "confidence": 0.683 + } + ] + }, + { + "id": 9, + "seek": 2600, + "start": 30.5, + "end": 31.8, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + 
"avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.586, + "words": [ + { + "text": "What", + "start": 30.5, + "end": 31.1, + "confidence": 0.193 + }, + { + "text": "are", + "start": 31.1, + "end": 31.14, + "confidence": 0.532 + }, + { + "text": "you", + "start": 31.14, + "end": 31.46, + "confidence": 0.966 + }, + { + "text": "telling", + "start": 31.46, + "end": 31.5, + "confidence": 0.588 + }, + { + "text": "me,", + "start": 31.5, + "end": 31.68, + "confidence": 0.895 + }, + { + "text": "dude?", + "start": 31.68, + "end": 31.8, + "confidence": 0.776 + } + ] + }, + { + "id": 10, + "seek": 2600, + "start": 31.8, + "end": 32.58, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.664, + "words": [ + { + "text": "What", + "start": 31.8, + "end": 32.26, + "confidence": 0.321 + }, + { + "text": "are", + "start": 32.26, + "end": 32.3, + "confidence": 0.594 + }, + { + "text": "you", + "start": 32.3, + "end": 32.4, + "confidence": 0.972 + }, + { + "text": "telling", + "start": 32.4, + "end": 32.44, + "confidence": 0.609 + }, + { + "text": "me,", + "start": 32.44, + "end": 32.48, + "confidence": 0.891 + }, + { + "text": "dude?", + "start": 32.48, + "end": 32.58, + "confidence": 0.85 + } + ] + }, + { + "id": 11, + "seek": 2600, + "start": 33.52, + "end": 35.4, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.711, + "words": [ + { + "text": "What", + "start": 33.52, + "end": 33.56, + "confidence": 0.44 + }, + { + "text": "are", + 
"start": 33.56, + "end": 33.66, + "confidence": 0.602 + }, + { + "text": "you", + "start": 33.66, + "end": 33.74, + "confidence": 0.972 + }, + { + "text": "telling", + "start": 33.74, + "end": 34.84, + "confidence": 0.635 + }, + { + "text": "me,", + "start": 34.84, + "end": 35.36, + "confidence": 0.901 + }, + { + "text": "dude?", + "start": 35.36, + "end": 35.4, + "confidence": 0.88 + } + ] + }, + { + "id": 12, + "seek": 2600, + "start": 36.24, + "end": 38.1, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.745, + "words": [ + { + "text": "What", + "start": 36.24, + "end": 36.34, + "confidence": 0.474 + }, + { + "text": "are", + "start": 36.34, + "end": 36.38, + "confidence": 0.621 + }, + { + "text": "you", + "start": 36.38, + "end": 37.34, + "confidence": 0.973 + }, + { + "text": "telling", + "start": 37.34, + "end": 37.42, + "confidence": 0.715 + }, + { + "text": "me,", + "start": 37.42, + "end": 38.06, + "confidence": 0.929 + }, + { + "text": "dude?", + "start": 38.06, + "end": 38.1, + "confidence": 0.9 + } + ] + }, + { + "id": 13, + "seek": 2600, + "start": 38.1, + "end": 38.62, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.787, + "words": [ + { + "text": "What", + "start": 38.1, + "end": 38.14, + "confidence": 0.555 + }, + { + "text": "are", + "start": 38.14, + "end": 38.18, + "confidence": 0.674 + }, + { + "text": "you", + "start": 38.18, + "end": 38.22, + "confidence": 0.978 + }, + { + "text": "telling", + "start": 38.22, + "end": 38.26, + "confidence": 0.751 + }, + { + "text": "me,", + "start": 
38.26, + "end": 38.3, + "confidence": 0.936 + }, + { + "text": "dude?", + "start": 38.3, + "end": 38.62, + "confidence": 0.921 + } + ] + }, + { + "id": 14, + "seek": 2600, + "start": 39.52, + "end": 41.92, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.813, + "words": [ + { + "text": "What", + "start": 39.52, + "end": 40.78, + "confidence": 0.577 + }, + { + "text": "are", + "start": 40.78, + "end": 41.06, + "confidence": 0.737 + }, + { + "text": "you", + "start": 41.06, + "end": 41.14, + "confidence": 0.982 + }, + { + "text": "telling", + "start": 41.14, + "end": 41.18, + "confidence": 0.785 + }, + { + "text": "me,", + "start": 41.18, + "end": 41.86, + "confidence": 0.941 + }, + { + "text": "dude?", + "start": 41.86, + "end": 41.92, + "confidence": 0.936 + } + ] + }, + { + "id": 15, + "seek": 2600, + "start": 41.92, + "end": 42.86, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.834, + "words": [ + { + "text": "What", + "start": 41.92, + "end": 41.96, + "confidence": 0.644 + }, + { + "text": "are", + "start": 41.96, + "end": 42.0, + "confidence": 0.752 + }, + { + "text": "you", + "start": 42.0, + "end": 42.08, + "confidence": 0.985 + }, + { + "text": "telling", + "start": 42.08, + "end": 42.3, + "confidence": 0.788 + }, + { + "text": "me,", + "start": 42.3, + "end": 42.82, + "confidence": 0.953 + }, + { + "text": "dude?", + "start": 42.82, + "end": 42.86, + "confidence": 0.938 + } + ] + }, + { + "id": 16, + "seek": 2600, + "start": 44.5, + "end": 46.46, + "text": " What are you telling me, dude?", + 
"tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.795, + "words": [ + { + "text": "What", + "start": 44.5, + "end": 45.0, + "confidence": 0.502 + }, + { + "text": "are", + "start": 45.0, + "end": 45.64, + "confidence": 0.732 + }, + { + "text": "you", + "start": 45.64, + "end": 45.72, + "confidence": 0.985 + }, + { + "text": "telling", + "start": 45.72, + "end": 45.92, + "confidence": 0.789 + }, + { + "text": "me,", + "start": 45.92, + "end": 46.38, + "confidence": 0.952 + }, + { + "text": "dude?", + "start": 46.38, + "end": 46.46, + "confidence": 0.932 + } + ] + }, + { + "id": 17, + "seek": 2600, + "start": 46.46, + "end": 46.94, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.789, + "words": [ + { + "text": "What", + "start": 46.46, + "end": 46.5, + "confidence": 0.481 + }, + { + "text": "are", + "start": 46.5, + "end": 46.54, + "confidence": 0.742 + }, + { + "text": "you", + "start": 46.54, + "end": 46.58, + "confidence": 0.987 + }, + { + "text": "telling", + "start": 46.58, + "end": 46.62, + "confidence": 0.779 + }, + { + "text": "me,", + "start": 46.62, + "end": 46.66, + "confidence": 0.948 + }, + { + "text": "dude?", + "start": 46.66, + "end": 46.94, + "confidence": 0.932 + } + ] + }, + { + "id": 18, + "seek": 2600, + "start": 47.52, + "end": 48.46, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.792, + "words": [ + 
{ + "text": "What", + "start": 47.52, + "end": 47.56, + "confidence": 0.479 + }, + { + "text": "are", + "start": 47.56, + "end": 48.04, + "confidence": 0.746 + }, + { + "text": "you", + "start": 48.04, + "end": 48.1, + "confidence": 0.987 + }, + { + "text": "telling", + "start": 48.1, + "end": 48.28, + "confidence": 0.785 + }, + { + "text": "me,", + "start": 48.28, + "end": 48.42, + "confidence": 0.95 + }, + { + "text": "dude?", + "start": 48.42, + "end": 48.46, + "confidence": 0.936 + } + ] + }, + { + "id": 19, + "seek": 2600, + "start": 49.52, + "end": 51.38, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.838, + "words": [ + { + "text": "What", + "start": 49.52, + "end": 50.24, + "confidence": 0.651 + }, + { + "text": "are", + "start": 50.24, + "end": 50.48, + "confidence": 0.757 + }, + { + "text": "you", + "start": 50.48, + "end": 50.56, + "confidence": 0.989 + }, + { + "text": "telling", + "start": 50.56, + "end": 50.6, + "confidence": 0.793 + }, + { + "text": "me,", + "start": 50.6, + "end": 51.32, + "confidence": 0.95 + }, + { + "text": "dude?", + "start": 51.32, + "end": 51.38, + "confidence": 0.943 + } + ] + }, + { + "id": 20, + "seek": 2600, + "start": 51.98, + "end": 54.06, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.26995800480698096, + "compression_ratio": 9.136363636363637, + "no_speech_prob": 0.0041488660499453545, + "confidence": 0.78, + "words": [ + { + "text": "What", + "start": 51.98, + "end": 52.14, + "confidence": 0.43 + }, + { + "text": "are", + "start": 52.14, + "end": 52.62, + "confidence": 0.737 + }, + { + "text": "you", + "start": 52.62, + "end": 52.72, + "confidence": 0.988 + }, + { + "text": 
"telling", + "start": 52.72, + "end": 52.88, + "confidence": 0.81 + }, + { + "text": "me,", + "start": 52.88, + "end": 54.02, + "confidence": 0.943 + }, + { + "text": "dude?", + "start": 54.02, + "end": 54.06, + "confidence": 0.944 + } + ] + }, + { + "id": 21, + "seek": 5400, + "start": 54.06, + "end": 55.0, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.7, + "words": [ + { + "text": "What", + "start": 54.06, + "end": 54.1, + "confidence": 0.506 + }, + { + "text": "are", + "start": 54.1, + "end": 54.2, + "confidence": 0.588 + }, + { + "text": "you", + "start": 54.2, + "end": 54.46, + "confidence": 0.876 + }, + { + "text": "telling", + "start": 54.46, + "end": 54.5, + "confidence": 0.747 + }, + { + "text": "me,", + "start": 54.5, + "end": 54.96, + "confidence": 0.71 + }, + { + "text": "dude?", + "start": 54.96, + "end": 55.0, + "confidence": 0.848 + } + ] + }, + { + "id": 22, + "seek": 5400, + "start": 56.5, + "end": 58.0, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.739, + "words": [ + { + "text": "What", + "start": 56.5, + "end": 56.82, + "confidence": 0.512 + }, + { + "text": "are", + "start": 56.82, + "end": 56.92, + "confidence": 0.568 + }, + { + "text": "you", + "start": 56.92, + "end": 57.12, + "confidence": 0.964 + }, + { + "text": "telling", + "start": 57.12, + "end": 57.16, + "confidence": 0.808 + }, + { + "text": "me,", + "start": 57.16, + "end": 57.96, + "confidence": 0.803 + }, + { + "text": "dude?", + "start": 57.96, + "end": 58.0, + "confidence": 0.897 + } + ] + }, + { + "id": 23, + "seek": 
5400, + "start": 58.0, + "end": 58.9, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.741, + "words": [ + { + "text": "What", + "start": 58.0, + "end": 58.64, + "confidence": 0.48 + }, + { + "text": "are", + "start": 58.64, + "end": 58.68, + "confidence": 0.584 + }, + { + "text": "you", + "start": 58.68, + "end": 58.78, + "confidence": 0.954 + }, + { + "text": "telling", + "start": 58.78, + "end": 58.82, + "confidence": 0.816 + }, + { + "text": "me,", + "start": 58.82, + "end": 58.86, + "confidence": 0.837 + }, + { + "text": "dude?", + "start": 58.86, + "end": 58.9, + "confidence": 0.908 + } + ] + }, + { + "id": 24, + "seek": 5400, + "start": 59.52, + "end": 60.5, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.783, + "words": [ + { + "text": "What", + "start": 59.52, + "end": 60.02, + "confidence": 0.58 + }, + { + "text": "are", + "start": 60.02, + "end": 60.18, + "confidence": 0.641 + }, + { + "text": "you", + "start": 60.18, + "end": 60.22, + "confidence": 0.967 + }, + { + "text": "telling", + "start": 60.22, + "end": 60.26, + "confidence": 0.826 + }, + { + "text": "me,", + "start": 60.26, + "end": 60.38, + "confidence": 0.853 + }, + { + "text": "dude?", + "start": 60.38, + "end": 60.5, + "confidence": 0.911 + } + ] + }, + { + "id": 25, + "seek": 5400, + "start": 61.52, + "end": 62.82, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + 
"no_speech_prob": 0.0238738264888525, + "confidence": 0.803, + "words": [ + { + "text": "What", + "start": 61.52, + "end": 62.34, + "confidence": 0.613 + }, + { + "text": "are", + "start": 62.34, + "end": 62.38, + "confidence": 0.66 + }, + { + "text": "you", + "start": 62.38, + "end": 62.42, + "confidence": 0.967 + }, + { + "text": "telling", + "start": 62.42, + "end": 62.74, + "confidence": 0.835 + }, + { + "text": "me,", + "start": 62.74, + "end": 62.78, + "confidence": 0.892 + }, + { + "text": "dude?", + "start": 62.78, + "end": 62.82, + "confidence": 0.918 + } + ] + }, + { + "id": 26, + "seek": 5400, + "start": 63.52, + "end": 65.59, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.835, + "words": [ + { + "text": "What", + "start": 63.52, + "end": 64.12, + "confidence": 0.731 + }, + { + "text": "are", + "start": 64.12, + "end": 64.26, + "confidence": 0.666 + }, + { + "text": "you", + "start": 64.26, + "end": 64.3, + "confidence": 0.971 + }, + { + "text": "telling", + "start": 64.3, + "end": 64.6, + "confidence": 0.864 + }, + { + "text": "me,", + "start": 64.6, + "end": 65.02, + "confidence": 0.902 + }, + { + "text": "dude?", + "start": 65.02, + "end": 65.59, + "confidence": 0.92 + } + ] + }, + { + "id": 27, + "seek": 5400, + "start": 65.59, + "end": 66.94, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.825, + "words": [ + { + "text": "What", + "start": 65.59, + "end": 65.84, + "confidence": 0.635 + }, + { + "text": "are", + "start": 65.84, + "end": 65.88, + "confidence": 0.691 + }, + { + "text": "you", + 
"start": 65.88, + "end": 65.92, + "confidence": 0.975 + }, + { + "text": "telling", + "start": 65.92, + "end": 65.96, + "confidence": 0.866 + }, + { + "text": "me,", + "start": 65.96, + "end": 66.86, + "confidence": 0.918 + }, + { + "text": "dude?", + "start": 66.86, + "end": 66.94, + "confidence": 0.927 + } + ] + }, + { + "id": 28, + "seek": 5400, + "start": 67.52, + "end": 69.18, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.821, + "words": [ + { + "text": "What", + "start": 67.52, + "end": 67.76, + "confidence": 0.572 + }, + { + "text": "are", + "start": 67.76, + "end": 67.9, + "confidence": 0.721 + }, + { + "text": "you", + "start": 67.9, + "end": 67.98, + "confidence": 0.979 + }, + { + "text": "telling", + "start": 67.98, + "end": 68.06, + "confidence": 0.88 + }, + { + "text": "me,", + "start": 68.06, + "end": 68.74, + "confidence": 0.923 + }, + { + "text": "dude?", + "start": 68.74, + "end": 69.18, + "confidence": 0.931 + } + ] + }, + { + "id": 29, + "seek": 5400, + "start": 69.86, + "end": 72.14, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.831, + "words": [ + { + "text": "What", + "start": 69.86, + "end": 69.9, + "confidence": 0.61 + }, + { + "text": "are", + "start": 69.9, + "end": 70.14, + "confidence": 0.724 + }, + { + "text": "you", + "start": 70.14, + "end": 70.54, + "confidence": 0.98 + }, + { + "text": "telling", + "start": 70.54, + "end": 71.0, + "confidence": 0.876 + }, + { + "text": "me,", + "start": 71.0, + "end": 71.9, + "confidence": 0.928 + }, + { + "text": "dude?", + "start": 71.9, 
+ "end": 72.14, + "confidence": 0.932 + } + ] + }, + { + "id": 30, + "seek": 5400, + "start": 72.14, + "end": 72.76, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.813, + "words": [ + { + "text": "What", + "start": 72.14, + "end": 72.4, + "confidence": 0.516 + }, + { + "text": "are", + "start": 72.4, + "end": 72.44, + "confidence": 0.736 + }, + { + "text": "you", + "start": 72.44, + "end": 72.52, + "confidence": 0.982 + }, + { + "text": "telling", + "start": 72.52, + "end": 72.6, + "confidence": 0.88 + }, + { + "text": "me,", + "start": 72.6, + "end": 72.72, + "confidence": 0.943 + }, + { + "text": "dude?", + "start": 72.72, + "end": 72.76, + "confidence": 0.937 + } + ] + }, + { + "id": 31, + "seek": 5400, + "start": 74.08, + "end": 76.34, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.85, + "words": [ + { + "text": "What", + "start": 74.08, + "end": 74.32, + "confidence": 0.651 + }, + { + "text": "are", + "start": 74.32, + "end": 74.36, + "confidence": 0.755 + }, + { + "text": "you", + "start": 74.36, + "end": 74.94, + "confidence": 0.984 + }, + { + "text": "telling", + "start": 74.94, + "end": 75.56, + "confidence": 0.88 + }, + { + "text": "me,", + "start": 75.56, + "end": 76.3, + "confidence": 0.943 + }, + { + "text": "dude?", + "start": 76.3, + "end": 76.34, + "confidence": 0.937 + } + ] + }, + { + "id": 32, + "seek": 5400, + "start": 76.34, + "end": 77.98, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + 
"avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.839, + "words": [ + { + "text": "What", + "start": 76.34, + "end": 77.38, + "confidence": 0.607 + }, + { + "text": "are", + "start": 77.38, + "end": 77.42, + "confidence": 0.759 + }, + { + "text": "you", + "start": 77.42, + "end": 77.46, + "confidence": 0.985 + }, + { + "text": "telling", + "start": 77.46, + "end": 77.54, + "confidence": 0.879 + }, + { + "text": "me,", + "start": 77.54, + "end": 77.94, + "confidence": 0.938 + }, + { + "text": "dude?", + "start": 77.94, + "end": 77.98, + "confidence": 0.936 + } + ] + }, + { + "id": 33, + "seek": 5400, + "start": 77.98, + "end": 79.08, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.85, + "words": [ + { + "text": "What", + "start": 77.98, + "end": 78.02, + "confidence": 0.636 + }, + { + "text": "are", + "start": 78.02, + "end": 78.06, + "confidence": 0.75 + }, + { + "text": "you", + "start": 78.06, + "end": 78.92, + "confidence": 0.985 + }, + { + "text": "telling", + "start": 78.92, + "end": 78.96, + "confidence": 0.894 + }, + { + "text": "me,", + "start": 78.96, + "end": 79.04, + "confidence": 0.954 + }, + { + "text": "dude?", + "start": 79.04, + "end": 79.08, + "confidence": 0.939 + } + ] + }, + { + "id": 34, + "seek": 5400, + "start": 80.22, + "end": 81.66, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.17690415449545416, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0238738264888525, + "confidence": 0.813, + "words": [ + { + "text": "What", + "start": 80.22, + "end": 80.26, + "confidence": 0.484 + }, + { + "text": "are", 
+ "start": 80.26, + "end": 80.6, + "confidence": 0.745 + }, + { + "text": "you", + "start": 80.6, + "end": 80.68, + "confidence": 0.985 + }, + { + "text": "telling", + "start": 80.68, + "end": 80.96, + "confidence": 0.899 + }, + { + "text": "me,", + "start": 80.96, + "end": 81.62, + "confidence": 0.96 + }, + { + "text": "dude?", + "start": 81.62, + "end": 81.66, + "confidence": 0.942 + } + ] + }, + { + "id": 35, + "seek": 8200, + "start": 82.02, + "end": 83.08, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.772, + "words": [ + { + "text": "What", + "start": 82.02, + "end": 82.06, + "confidence": 0.701 + }, + { + "text": "are", + "start": 82.06, + "end": 82.28, + "confidence": 0.488 + }, + { + "text": "you", + "start": 82.28, + "end": 82.38, + "confidence": 0.934 + }, + { + "text": "telling", + "start": 82.38, + "end": 82.42, + "confidence": 0.755 + }, + { + "text": "me,", + "start": 82.42, + "end": 82.86, + "confidence": 0.92 + }, + { + "text": "dude?", + "start": 82.86, + "end": 83.08, + "confidence": 0.956 + } + ] + }, + { + "id": 36, + "seek": 8200, + "start": 84.34, + "end": 85.3, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.786, + "words": [ + { + "text": "What", + "start": 84.34, + "end": 84.38, + "confidence": 0.529 + }, + { + "text": "are", + "start": 84.38, + "end": 84.64, + "confidence": 0.637 + }, + { + "text": "you", + "start": 84.64, + "end": 85.12, + "confidence": 0.969 + }, + { + "text": "telling", + "start": 85.12, + "end": 85.16, + "confidence": 0.815 + }, + { + "text": "me,", + 
"start": 85.16, + "end": 85.26, + "confidence": 0.932 + }, + { + "text": "dude?", + "start": 85.26, + "end": 85.3, + "confidence": 0.952 + } + ] + }, + { + "id": 37, + "seek": 8200, + "start": 85.52, + "end": 87.94, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.836, + "words": [ + { + "text": "What", + "start": 85.52, + "end": 86.82, + "confidence": 0.676 + }, + { + "text": "are", + "start": 86.82, + "end": 86.86, + "confidence": 0.703 + }, + { + "text": "you", + "start": 86.86, + "end": 86.98, + "confidence": 0.97 + }, + { + "text": "telling", + "start": 86.98, + "end": 87.02, + "confidence": 0.826 + }, + { + "text": "me,", + "start": 87.02, + "end": 87.9, + "confidence": 0.942 + }, + { + "text": "dude?", + "start": 87.9, + "end": 87.94, + "confidence": 0.955 + } + ] + }, + { + "id": 38, + "seek": 8200, + "start": 87.94, + "end": 89.56, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.849, + "words": [ + { + "text": "What", + "start": 87.94, + "end": 88.34, + "confidence": 0.7 + }, + { + "text": "are", + "start": 88.34, + "end": 89.16, + "confidence": 0.717 + }, + { + "text": "you", + "start": 89.16, + "end": 89.44, + "confidence": 0.976 + }, + { + "text": "telling", + "start": 89.44, + "end": 89.48, + "confidence": 0.84 + }, + { + "text": "me,", + "start": 89.48, + "end": 89.52, + "confidence": 0.954 + }, + { + "text": "dude?", + "start": 89.52, + "end": 89.56, + "confidence": 0.954 + } + ] + }, + { + "id": 39, + "seek": 8200, + "start": 89.94, + "end": 90.9, + "text": " What are you telling me, dude?", 
+ "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.859, + "words": [ + { + "text": "What", + "start": 89.94, + "end": 90.1, + "confidence": 0.747 + }, + { + "text": "are", + "start": 90.1, + "end": 90.14, + "confidence": 0.718 + }, + { + "text": "you", + "start": 90.14, + "end": 90.28, + "confidence": 0.976 + }, + { + "text": "telling", + "start": 90.28, + "end": 90.5, + "confidence": 0.847 + }, + { + "text": "me,", + "start": 90.5, + "end": 90.86, + "confidence": 0.944 + }, + { + "text": "dude?", + "start": 90.86, + "end": 90.9, + "confidence": 0.959 + } + ] + }, + { + "id": 40, + "seek": 8200, + "start": 91.52, + "end": 92.2, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.851, + "words": [ + { + "text": "What", + "start": 91.52, + "end": 91.6, + "confidence": 0.723 + }, + { + "text": "are", + "start": 91.6, + "end": 91.64, + "confidence": 0.718 + }, + { + "text": "you", + "start": 91.64, + "end": 91.68, + "confidence": 0.978 + }, + { + "text": "telling", + "start": 91.68, + "end": 91.72, + "confidence": 0.83 + }, + { + "text": "me,", + "start": 91.72, + "end": 92.16, + "confidence": 0.944 + }, + { + "text": "dude?", + "start": 92.16, + "end": 92.2, + "confidence": 0.958 + } + ] + }, + { + "id": 41, + "seek": 8200, + "start": 93.52, + "end": 94.66, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.862, + "words": [ + { + 
"text": "What", + "start": 93.52, + "end": 94.04, + "confidence": 0.743 + }, + { + "text": "are", + "start": 94.04, + "end": 94.08, + "confidence": 0.73 + }, + { + "text": "you", + "start": 94.08, + "end": 94.24, + "confidence": 0.981 + }, + { + "text": "telling", + "start": 94.24, + "end": 94.28, + "confidence": 0.848 + }, + { + "text": "me,", + "start": 94.28, + "end": 94.36, + "confidence": 0.949 + }, + { + "text": "dude?", + "start": 94.36, + "end": 94.66, + "confidence": 0.962 + } + ] + }, + { + "id": 42, + "seek": 8200, + "start": 95.52, + "end": 98.44, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.867, + "words": [ + { + "text": "What", + "start": 95.52, + "end": 97.08, + "confidence": 0.72 + }, + { + "text": "are", + "start": 97.08, + "end": 97.16, + "confidence": 0.762 + }, + { + "text": "you", + "start": 97.16, + "end": 97.28, + "confidence": 0.984 + }, + { + "text": "telling", + "start": 97.28, + "end": 97.72, + "confidence": 0.862 + }, + { + "text": "me,", + "start": 97.72, + "end": 98.4, + "confidence": 0.951 + }, + { + "text": "dude?", + "start": 98.4, + "end": 98.44, + "confidence": 0.962 + } + ] + }, + { + "id": 43, + "seek": 8200, + "start": 98.44, + "end": 98.9, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.885, + "words": [ + { + "text": "What", + "start": 98.44, + "end": 98.48, + "confidence": 0.77 + }, + { + "text": "are", + "start": 98.48, + "end": 98.52, + "confidence": 0.781 + }, + { + "text": "you", + "start": 98.52, + "end": 98.78, + "confidence": 0.986 + }, + { + "text": 
"telling", + "start": 98.78, + "end": 98.82, + "confidence": 0.867 + }, + { + "text": "me,", + "start": 98.82, + "end": 98.86, + "confidence": 0.965 + }, + { + "text": "dude?", + "start": 98.86, + "end": 98.9, + "confidence": 0.965 + } + ] + }, + { + "id": 44, + "seek": 8200, + "start": 99.52, + "end": 101.8, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.887, + "words": [ + { + "text": "What", + "start": 99.52, + "end": 101.06, + "confidence": 0.741 + }, + { + "text": "are", + "start": 101.06, + "end": 101.1, + "confidence": 0.806 + }, + { + "text": "you", + "start": 101.1, + "end": 101.14, + "confidence": 0.989 + }, + { + "text": "telling", + "start": 101.14, + "end": 101.44, + "confidence": 0.88 + }, + { + "text": "me,", + "start": 101.44, + "end": 101.76, + "confidence": 0.972 + }, + { + "text": "dude?", + "start": 101.76, + "end": 101.8, + "confidence": 0.966 + } + ] + }, + { + "id": 45, + "seek": 8200, + "start": 101.8, + "end": 103.02, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.881, + "words": [ + { + "text": "What", + "start": 101.8, + "end": 102.82, + "confidence": 0.731 + }, + { + "text": "are", + "start": 102.82, + "end": 102.86, + "confidence": 0.796 + }, + { + "text": "you", + "start": 102.86, + "end": 102.9, + "confidence": 0.988 + }, + { + "text": "telling", + "start": 102.9, + "end": 102.94, + "confidence": 0.868 + }, + { + "text": "me,", + "start": 102.94, + "end": 102.98, + "confidence": 0.971 + }, + { + "text": "dude?", + "start": 102.98, + "end": 103.02, + "confidence": 0.966 + } 
+ ] + }, + { + "id": 46, + "seek": 8200, + "start": 104.5, + "end": 105.34, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.888, + "words": [ + { + "text": "What", + "start": 104.5, + "end": 104.82, + "confidence": 0.737 + }, + { + "text": "are", + "start": 104.82, + "end": 105.16, + "confidence": 0.806 + }, + { + "text": "you", + "start": 105.16, + "end": 105.2, + "confidence": 0.99 + }, + { + "text": "telling", + "start": 105.2, + "end": 105.24, + "confidence": 0.885 + }, + { + "text": "me,", + "start": 105.24, + "end": 105.3, + "confidence": 0.974 + }, + { + "text": "dude?", + "start": 105.3, + "end": 105.34, + "confidence": 0.967 + } + ] + }, + { + "id": 47, + "seek": 8200, + "start": 106.5, + "end": 108.02, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.874, + "words": [ + { + "text": "What", + "start": 106.5, + "end": 106.92, + "confidence": 0.697 + }, + { + "text": "are", + "start": 106.92, + "end": 107.1, + "confidence": 0.786 + }, + { + "text": "you", + "start": 107.1, + "end": 107.14, + "confidence": 0.99 + }, + { + "text": "telling", + "start": 107.14, + "end": 107.18, + "confidence": 0.876 + }, + { + "text": "me,", + "start": 107.18, + "end": 107.76, + "confidence": 0.971 + }, + { + "text": "dude?", + "start": 107.76, + "end": 108.02, + "confidence": 0.968 + } + ] + }, + { + "id": 48, + "seek": 8200, + "start": 108.02, + "end": 109.54, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": 
-0.1252204868155466, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0009642249788157642, + "confidence": 0.82, + "words": [ + { + "text": "What", + "start": 108.02, + "end": 108.06, + "confidence": 0.48 + }, + { + "text": "are", + "start": 108.06, + "end": 108.2, + "confidence": 0.773 + }, + { + "text": "you", + "start": 108.2, + "end": 108.24, + "confidence": 0.99 + }, + { + "text": "telling", + "start": 108.24, + "end": 108.34, + "confidence": 0.878 + }, + { + "text": "me,", + "start": 108.34, + "end": 109.48, + "confidence": 0.97 + }, + { + "text": "dude?", + "start": 109.48, + "end": 109.54, + "confidence": 0.97 + } + ] + }, + { + "id": 49, + "seek": 11000, + "start": 110.02, + "end": 110.56, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.719, + "words": [ + { + "text": "What", + "start": 110.02, + "end": 110.16, + "confidence": 0.419 + }, + { + "text": "are", + "start": 110.16, + "end": 110.2, + "confidence": 0.523 + }, + { + "text": "you", + "start": 110.2, + "end": 110.24, + "confidence": 0.913 + }, + { + "text": "telling", + "start": 110.24, + "end": 110.48, + "confidence": 0.79 + }, + { + "text": "me,", + "start": 110.48, + "end": 110.52, + "confidence": 0.904 + }, + { + "text": "dude?", + "start": 110.52, + "end": 110.56, + "confidence": 0.964 + } + ] + }, + { + "id": 50, + "seek": 11000, + "start": 112.14, + "end": 113.52, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.835, + "words": [ + { + "text": "What", + "start": 112.14, + "end": 112.3, + "confidence": 0.644 + }, + { + 
"text": "are", + "start": 112.3, + "end": 113.22, + "confidence": 0.734 + }, + { + "text": "you", + "start": 113.22, + "end": 113.4, + "confidence": 0.978 + }, + { + "text": "telling", + "start": 113.4, + "end": 113.44, + "confidence": 0.821 + }, + { + "text": "me,", + "start": 113.44, + "end": 113.48, + "confidence": 0.933 + }, + { + "text": "dude?", + "start": 113.48, + "end": 113.52, + "confidence": 0.962 + } + ] + }, + { + "id": 51, + "seek": 11000, + "start": 113.9, + "end": 114.9, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.832, + "words": [ + { + "text": "What", + "start": 113.9, + "end": 114.06, + "confidence": 0.615 + }, + { + "text": "are", + "start": 114.06, + "end": 114.16, + "confidence": 0.733 + }, + { + "text": "you", + "start": 114.16, + "end": 114.36, + "confidence": 0.978 + }, + { + "text": "telling", + "start": 114.36, + "end": 114.4, + "confidence": 0.832 + }, + { + "text": "me,", + "start": 114.4, + "end": 114.86, + "confidence": 0.934 + }, + { + "text": "dude?", + "start": 114.86, + "end": 114.9, + "confidence": 0.967 + } + ] + }, + { + "id": 52, + "seek": 11000, + "start": 115.52, + "end": 117.54, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.86, + "words": [ + { + "text": "What", + "start": 115.52, + "end": 116.54, + "confidence": 0.67 + }, + { + "text": "are", + "start": 116.54, + "end": 116.58, + "confidence": 0.788 + }, + { + "text": "you", + "start": 116.58, + "end": 116.64, + "confidence": 0.984 + }, + { + "text": "telling", + "start": 116.64, + "end": 116.68, + 
"confidence": 0.852 + }, + { + "text": "me,", + "start": 116.68, + "end": 117.44, + "confidence": 0.947 + }, + { + "text": "dude?", + "start": 117.44, + "end": 117.54, + "confidence": 0.966 + } + ] + }, + { + "id": 53, + "seek": 11000, + "start": 118.18, + "end": 120.14, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.88, + "words": [ + { + "text": "What", + "start": 118.18, + "end": 118.36, + "confidence": 0.758 + }, + { + "text": "are", + "start": 118.36, + "end": 118.4, + "confidence": 0.789 + }, + { + "text": "you", + "start": 118.4, + "end": 118.74, + "confidence": 0.985 + }, + { + "text": "telling", + "start": 118.74, + "end": 118.82, + "confidence": 0.858 + }, + { + "text": "me,", + "start": 118.82, + "end": 120.1, + "confidence": 0.948 + }, + { + "text": "dude?", + "start": 120.1, + "end": 120.14, + "confidence": 0.968 + } + ] + }, + { + "id": 54, + "seek": 11000, + "start": 120.14, + "end": 120.38, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.884, + "words": [ + { + "text": "What", + "start": 120.14, + "end": 120.18, + "confidence": 0.757 + }, + { + "text": "are", + "start": 120.18, + "end": 120.22, + "confidence": 0.808 + }, + { + "text": "you", + "start": 120.22, + "end": 120.26, + "confidence": 0.986 + }, + { + "text": "telling", + "start": 120.26, + "end": 120.3, + "confidence": 0.857 + }, + { + "text": "me,", + "start": 120.3, + "end": 120.34, + "confidence": 0.954 + }, + { + "text": "dude?", + "start": 120.34, + "end": 120.38, + "confidence": 0.966 + } + ] + }, + { + "id": 55, + "seek": 
11000, + "start": 121.52, + "end": 123.36, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.874, + "words": [ + { + "text": "What", + "start": 121.52, + "end": 122.72, + "confidence": 0.718 + }, + { + "text": "are", + "start": 122.72, + "end": 123.2, + "confidence": 0.788 + }, + { + "text": "you", + "start": 123.2, + "end": 123.24, + "confidence": 0.986 + }, + { + "text": "telling", + "start": 123.24, + "end": 123.28, + "confidence": 0.865 + }, + { + "text": "me,", + "start": 123.28, + "end": 123.32, + "confidence": 0.952 + }, + { + "text": "dude?", + "start": 123.32, + "end": 123.36, + "confidence": 0.968 + } + ] + }, + { + "id": 56, + "seek": 11000, + "start": 123.52, + "end": 125.14, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.882, + "words": [ + { + "text": "What", + "start": 123.52, + "end": 124.56, + "confidence": 0.718 + }, + { + "text": "are", + "start": 124.56, + "end": 124.74, + "confidence": 0.821 + }, + { + "text": "you", + "start": 124.74, + "end": 125.02, + "confidence": 0.989 + }, + { + "text": "telling", + "start": 125.02, + "end": 125.06, + "confidence": 0.878 + }, + { + "text": "me,", + "start": 125.06, + "end": 125.1, + "confidence": 0.952 + }, + { + "text": "dude?", + "start": 125.1, + "end": 125.14, + "confidence": 0.968 + } + ] + }, + { + "id": 57, + "seek": 11000, + "start": 125.52, + "end": 127.58, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + 
"compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.894, + "words": [ + { + "text": "What", + "start": 125.52, + "end": 126.58, + "confidence": 0.747 + }, + { + "text": "are", + "start": 126.58, + "end": 126.9, + "confidence": 0.837 + }, + { + "text": "you", + "start": 126.9, + "end": 127.06, + "confidence": 0.991 + }, + { + "text": "telling", + "start": 127.06, + "end": 127.14, + "confidence": 0.883 + }, + { + "text": "me,", + "start": 127.14, + "end": 127.54, + "confidence": 0.962 + }, + { + "text": "dude?", + "start": 127.54, + "end": 127.58, + "confidence": 0.969 + } + ] + }, + { + "id": 58, + "seek": 11000, + "start": 127.58, + "end": 129.28, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.895, + "words": [ + { + "text": "What", + "start": 127.58, + "end": 128.98, + "confidence": 0.719 + }, + { + "text": "are", + "start": 128.98, + "end": 129.02, + "confidence": 0.859 + }, + { + "text": "you", + "start": 129.02, + "end": 129.06, + "confidence": 0.992 + }, + { + "text": "telling", + "start": 129.06, + "end": 129.1, + "confidence": 0.896 + }, + { + "text": "me,", + "start": 129.1, + "end": 129.14, + "confidence": 0.965 + }, + { + "text": "dude?", + "start": 129.14, + "end": 129.28, + "confidence": 0.971 + } + ] + }, + { + "id": 59, + "seek": 11000, + "start": 129.72, + "end": 131.68, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.89, + "words": [ + { + "text": "What", + "start": 129.72, + "end": 131.02, + "confidence": 0.703 + }, + { + "text": "are", + 
"start": 131.02, + "end": 131.46, + "confidence": 0.855 + }, + { + "text": "you", + "start": 131.46, + "end": 131.5, + "confidence": 0.992 + }, + { + "text": "telling", + "start": 131.5, + "end": 131.54, + "confidence": 0.89 + }, + { + "text": "me,", + "start": 131.54, + "end": 131.64, + "confidence": 0.964 + }, + { + "text": "dude?", + "start": 131.64, + "end": 131.68, + "confidence": 0.97 + } + ] + }, + { + "id": 60, + "seek": 11000, + "start": 131.68, + "end": 133.0, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.903, + "words": [ + { + "text": "What", + "start": 131.68, + "end": 132.36, + "confidence": 0.746 + }, + { + "text": "are", + "start": 132.36, + "end": 132.4, + "confidence": 0.86 + }, + { + "text": "you", + "start": 132.4, + "end": 132.44, + "confidence": 0.993 + }, + { + "text": "telling", + "start": 132.44, + "end": 132.48, + "confidence": 0.903 + }, + { + "text": "me,", + "start": 132.48, + "end": 132.52, + "confidence": 0.969 + }, + { + "text": "dude?", + "start": 132.52, + "end": 133.0, + "confidence": 0.972 + } + ] + }, + { + "id": 61, + "seek": 11000, + "start": 133.72, + "end": 135.54, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.891, + "words": [ + { + "text": "What", + "start": 133.72, + "end": 134.08, + "confidence": 0.692 + }, + { + "text": "are", + "start": 134.08, + "end": 134.14, + "confidence": 0.859 + }, + { + "text": "you", + "start": 134.14, + "end": 134.38, + "confidence": 0.993 + }, + { + "text": "telling", + "start": 134.38, + "end": 134.42, + "confidence": 0.9 + }, + 
{ + "text": "me,", + "start": 134.42, + "end": 135.5, + "confidence": 0.971 + }, + { + "text": "dude?", + "start": 135.5, + "end": 135.54, + "confidence": 0.974 + } + ] + }, + { + "id": 62, + "seek": 11000, + "start": 135.54, + "end": 136.88, + "text": " What are you telling me, dude?", + "tokens": [ + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.1162933564521897, + "compression_ratio": 9.840909090909092, + "no_speech_prob": 0.0005178684368729591, + "confidence": 0.855, + "words": [ + { + "text": "What", + "start": 135.54, + "end": 135.58, + "confidence": 0.534 + }, + { + "text": "are", + "start": 135.58, + "end": 135.62, + "confidence": 0.856 + }, + { + "text": "you", + "start": 135.62, + "end": 135.66, + "confidence": 0.993 + }, + { + "text": "telling", + "start": 135.66, + "end": 135.7, + "confidence": 0.906 + }, + { + "text": "me,", + "start": 135.7, + "end": 135.74, + "confidence": 0.972 + }, + { + "text": "dude?", + "start": 135.74, + "end": 136.88, + "confidence": 0.975 + } + ] + } + ], + "language": "en" +} \ No newline at end of file diff --git a/tests/expected/tiny_auto.cpu/smartphone.mp3.words.json b/tests/expected/tiny_auto.cpu/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..f90643caf0519b49ba0cbc0381cd8d8ced1f218b --- /dev/null +++ b/tests/expected/tiny_auto.cpu/smartphone.mp3.words.json @@ -0,0 +1,5038 @@ +{ + "text": " C'est évidence que dit Nicolas. Mais je me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière dans quelques interagues entraîne. Et il est d'ailleurs, c'est la photo c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces les grand-attêtes qu'il a été beaucoup très souvent ementionné. Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs nous ont appris à piquer sur des icônes. 
C'est ce que le smartphone ajoute le toucher, qui rend le contact plus direct, plus sensible. Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté tout flu de la navigation web pour aller directement en but. Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas, dit qu'il est très fondablement inédit dans l'histoire de l'humanité. Mais ça s'assoulait d'une autre interrogation. Est-ce que le fait que cette objet soit inédit un d'huies que notre rapport a lui est aussi un rapport inédit? Je veux dire, est-ce que le rapport qu'on a au sein de foi n'est comparable à celui qu'on entretenait à d'autres objectes techniques comme la voiture ou le téléphone? Il n'y a pas d'équivalent. On s'est espécie de nous voter dans la relation à l'objet. C'est facilement éterréciant parce qu'on a impression de, comme le 10, les utilisateurs et les efforts, elles aident dépendant de cette objet d'un lieu, en fait, une espèce de relation de médiation avec le monde qui rendent un peu avec la même sédiforme de le jeu. Donc, à objets inédits, rapport inédits. Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépenses et de rojets. Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objectes techniques et de leur infération dans le vie pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas se trompe pas vraiment. Pour autant, je sache. Il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais la dépense n'était pas du même mort, donc le rejet n'en plus n'était pas du même mort. On peut adorer sa bagnure, en avoir besoin pour plein de choses. Et là, le soir, quand on va se coucher, on la laisse. On l'a pas dans la main, quand on est collis, quand on n'en mène pas au chiot. On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. 
Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui continuuellement avec son smartphone dans la main, comme c'était une sorte de estimateur extère de l'intempis de lâcher à l'éantrénée, ça m'a eu immédiate. Bon, je dis ça pour le mome, mais évidemment, va là pour nos aussi. Donc, rapport immédiate d'accord. Mais pourquoi, à ton impression qu'on en sortira jamais? Et puis, il faut en remettre la faute sur les gens qui ont créé cette route merveilleux et diabolique, qui a dit à bollique par coeur, merveilleux. Les économistes parlent de dépendance du santé. Ces vidéos, en fait, on est un santé qui a été établie, c'est un soit mon termine, soit définissant des beurs, on définisse un signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 1.38, + "text": " C'est évidence que dit Nicolas.", + "tokens": [ + 383, + 6, + 377, + 20090, + 2778, + 631, + 6176, + 38268, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.625, + "words": [ + { + "text": "C'est", + "start": 0.42, + "end": 0.66, + "confidence": 0.849 + }, + { + "text": "évidence", + "start": 0.66, + "end": 0.94, + "confidence": 0.368 + }, + { + "text": "que", + "start": 0.94, + "end": 1.06, + "confidence": 0.883 + }, + { + "text": "dit", + "start": 1.06, + "end": 1.16, + "confidence": 0.344 + }, + { + "text": "Nicolas.", + "start": 1.16, + "end": 1.38, + "confidence": 0.921 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.66, + "end": 3.62, + "text": " Mais je me l'étais jamais formulé comme ça.", + "tokens": [ + 6313, + 1506, + 385, + 287, + 6, + 22824, + 14540, + 1254, + 425, + 526, + 5173, + 2788, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.745, + "words": [ + { + "text": "Mais", + "start": 1.66, + "end": 
1.9, + "confidence": 0.956 + }, + { + "text": "je", + "start": 1.9, + "end": 2.18, + "confidence": 0.629 + }, + { + "text": "me", + "start": 2.18, + "end": 2.3, + "confidence": 0.943 + }, + { + "text": "l'étais", + "start": 2.3, + "end": 2.54, + "confidence": 0.708 + }, + { + "text": "jamais", + "start": 2.54, + "end": 2.78, + "confidence": 0.962 + }, + { + "text": "formulé", + "start": 2.78, + "end": 3.2, + "confidence": 0.541 + }, + { + "text": "comme", + "start": 3.2, + "end": 3.34, + "confidence": 0.975 + }, + { + "text": "ça.", + "start": 3.34, + "end": 3.62, + "confidence": 0.979 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 4.14, + "end": 8.82, + "text": " Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière", + "tokens": [ + 8257, + 1956, + 3887, + 635, + 3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 635, + 12713, + 2776, + 730, + 17290, + 3916, + 11, + 2420, + 635, + 22267 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.762, + "words": [ + { + "text": "Ce", + "start": 4.14, + "end": 4.22, + "confidence": 0.39 + }, + { + "text": "qui", + "start": 4.22, + "end": 4.34, + "confidence": 0.934 + }, + { + "text": "fait", + "start": 4.34, + "end": 4.46, + "confidence": 0.735 + }, + { + "text": "la", + "start": 4.46, + "end": 4.56, + "confidence": 0.988 + }, + { + "text": "force", + "start": 4.56, + "end": 4.96, + "confidence": 0.933 + }, + { + "text": "du", + "start": 4.96, + "end": 5.16, + "confidence": 0.936 + }, + { + "text": "smartphone,", + "start": 5.16, + "end": 5.74, + "confidence": 0.909 + }, + { + "text": "c'est", + "start": 5.74, + "end": 6.12, + "confidence": 0.871 + }, + { + "text": "pas", + "start": 6.12, + "end": 6.2, + "confidence": 0.982 + }, + { + "text": "seulement", + "start": 6.2, + "end": 6.52, + "confidence": 0.991 + }, + { + "text": "la", + "start": 
6.52, + "end": 6.76, + "confidence": 0.627 + }, + { + "text": "cumulation", + "start": 6.76, + "end": 7.18, + "confidence": 0.679 + }, + { + "text": "des", + "start": 7.18, + "end": 7.54, + "confidence": 0.752 + }, + { + "text": "fonctions,", + "start": 7.54, + "end": 8.1, + "confidence": 0.826 + }, + { + "text": "mais", + "start": 8.1, + "end": 8.42, + "confidence": 0.511 + }, + { + "text": "la", + "start": 8.42, + "end": 8.58, + "confidence": 0.717 + }, + { + "text": "manière", + "start": 8.58, + "end": 8.82, + "confidence": 0.457 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 8.9, + "end": 10.84, + "text": " dans quelques interagues entraîne.", + "tokens": [ + 2680, + 16597, + 728, + 559, + 1247, + 22284, + 24741, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.3, + "words": [ + { + "text": "dans", + "start": 8.9, + "end": 9.04, + "confidence": 0.329 + }, + { + "text": "quelques", + "start": 9.04, + "end": 9.26, + "confidence": 0.282 + }, + { + "text": "interagues", + "start": 9.26, + "end": 10.18, + "confidence": 0.238 + }, + { + "text": "entraîne.", + "start": 10.18, + "end": 10.84, + "confidence": 0.421 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 11.04, + "end": 12.92, + "text": " Et il est d'ailleurs, c'est la photo c'est hyper convaincant.", + "tokens": [ + 3790, + 1930, + 871, + 274, + 6, + 19400, + 11, + 269, + 6, + 377, + 635, + 5052, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.625, + "words": [ + { + "text": "Et", + "start": 11.04, + "end": 11.1, + "confidence": 0.394 + }, + { + "text": "il", + "start": 11.1, + "end": 11.24, + "confidence": 0.128 + }, + { + "text": "est", + "start": 11.24, + "end": 11.38, + "confidence": 0.237 + }, + { + 
"text": "d'ailleurs,", + "start": 11.38, + "end": 11.62, + "confidence": 0.904 + }, + { + "text": "c'est", + "start": 11.62, + "end": 11.78, + "confidence": 0.879 + }, + { + "text": "la", + "start": 11.78, + "end": 11.82, + "confidence": 0.968 + }, + { + "text": "photo", + "start": 11.82, + "end": 11.92, + "confidence": 0.811 + }, + { + "text": "c'est", + "start": 11.92, + "end": 12.18, + "confidence": 0.792 + }, + { + "text": "hyper", + "start": 12.18, + "end": 12.38, + "confidence": 0.939 + }, + { + "text": "convaincant.", + "start": 12.38, + "end": 12.92, + "confidence": 0.494 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 13.26, + "end": 18.03, + "text": " Alors évidemment, il faudrait ajouter les interfaces les grand-attêtes qu'il a été beaucoup", + "tokens": [ + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 1512, + 2697, + 12, + 1591, + 38262, + 421, + 6, + 388, + 257, + 8862, + 8796 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.553, + "words": [ + { + "text": "Alors", + "start": 13.26, + "end": 13.48, + "confidence": 0.904 + }, + { + "text": "évidemment,", + "start": 13.48, + "end": 13.92, + "confidence": 0.785 + }, + { + "text": "il", + "start": 13.92, + "end": 14.4, + "confidence": 0.961 + }, + { + "text": "faudrait", + "start": 14.4, + "end": 14.76, + "confidence": 0.85 + }, + { + "text": "ajouter", + "start": 14.76, + "end": 15.38, + "confidence": 0.874 + }, + { + "text": "les", + "start": 15.38, + "end": 15.62, + "confidence": 0.933 + }, + { + "text": "interfaces", + "start": 15.62, + "end": 15.86, + "confidence": 0.359 + }, + { + "text": "les", + "start": 15.86, + "end": 16.5, + "confidence": 0.414 + }, + { + "text": "grand-attêtes", + "start": 16.5, + "end": 16.94, + "confidence": 0.178 + }, + { + "text": "qu'il", + "start": 16.94, + "end": 17.18, + "confidence": 0.632 + }, + { + "text": "a", 
+ "start": 17.18, + "end": 17.24, + "confidence": 0.969 + }, + { + "text": "été", + "start": 17.24, + "end": 17.5, + "confidence": 0.957 + }, + { + "text": "beaucoup", + "start": 17.5, + "end": 18.03, + "confidence": 0.572 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 18.03, + "end": 19.26, + "text": " très souvent ementionné.", + "tokens": [ + 5732, + 20847, + 846, + 1251, + 15055, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.541, + "words": [ + { + "text": "très", + "start": 18.03, + "end": 18.66, + "confidence": 0.959 + }, + { + "text": "souvent", + "start": 18.66, + "end": 18.82, + "confidence": 0.994 + }, + { + "text": "ementionné.", + "start": 18.82, + "end": 19.26, + "confidence": 0.365 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 19.86, + "end": 23.54, + "text": " Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs", + "tokens": [ + 6313, + 4428, + 11, + 1930, + 38694, + 8645, + 631, + 1512, + 1740, + 3324, + 6212, + 368, + 945, + 1567, + 17338, + 287, + 6, + 21210, + 11, + 1512, + 4792, + 13923, + 2156 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.648, + "words": [ + { + "text": "Mais", + "start": 19.86, + "end": 20.22, + "confidence": 0.975 + }, + { + "text": "bon,", + "start": 20.22, + "end": 20.56, + "confidence": 0.479 + }, + { + "text": "il", + "start": 20.56, + "end": 20.6, + "confidence": 0.978 + }, + { + "text": "faudrait", + "start": 20.6, + "end": 20.74, + "confidence": 0.753 + }, + { + "text": "que", + "start": 20.74, + "end": 20.92, + "confidence": 0.378 + }, + { + "text": "les", + "start": 20.92, + "end": 20.98, + "confidence": 0.182 + }, + { + "text": "profites", + "start": 20.98, + "end": 21.26, + "confidence": 0.622 + }, + { + "text": "aussi", + "start": 
21.26, + "end": 21.7, + "confidence": 0.502 + }, + { + "text": "de", + "start": 21.7, + "end": 21.84, + "confidence": 0.468 + }, + { + "text": "20", + "start": 21.84, + "end": 22.08, + "confidence": 0.924 + }, + { + "text": "ans", + "start": 22.08, + "end": 22.28, + "confidence": 0.937 + }, + { + "text": "pendant", + "start": 22.28, + "end": 22.46, + "confidence": 0.903 + }, + { + "text": "l'été,", + "start": 22.46, + "end": 22.96, + "confidence": 0.499 + }, + { + "text": "les", + "start": 22.96, + "end": 23.04, + "confidence": 0.861 + }, + { + "text": "ordinateurs", + "start": 23.04, + "end": 23.54, + "confidence": 0.934 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 23.58, + "end": 25.26, + "text": " nous ont appris à piquer sur des icônes.", + "tokens": [ + 4666, + 6592, + 724, + 5714, + 1531, + 280, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.663, + "words": [ + { + "text": "nous", + "start": 23.58, + "end": 23.74, + "confidence": 0.833 + }, + { + "text": "ont", + "start": 23.74, + "end": 23.86, + "confidence": 0.976 + }, + { + "text": "appris", + "start": 23.86, + "end": 24.06, + "confidence": 0.947 + }, + { + "text": "à", + "start": 24.06, + "end": 24.24, + "confidence": 0.24 + }, + { + "text": "piquer", + "start": 24.24, + "end": 24.42, + "confidence": 0.45 + }, + { + "text": "sur", + "start": 24.42, + "end": 24.68, + "confidence": 0.749 + }, + { + "text": "des", + "start": 24.68, + "end": 24.8, + "confidence": 0.96 + }, + { + "text": "icônes.", + "start": 24.8, + "end": 25.26, + "confidence": 0.656 + } + ] + }, + { + "id": 9, + "seek": 2556, + "start": 25.58, + "end": 30.56, + "text": " C'est ce que le smartphone ajoute le toucher, qui rend le contact plus direct, plus sensible.", + "tokens": [ + 383, + 6, + 377, + 1769, + 631, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 
260, + 11, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.643, + "words": [ + { + "text": "C'est", + "start": 25.58, + "end": 25.66, + "confidence": 0.449 + }, + { + "text": "ce", + "start": 25.66, + "end": 25.72, + "confidence": 0.491 + }, + { + "text": "que", + "start": 25.72, + "end": 25.94, + "confidence": 0.935 + }, + { + "text": "le", + "start": 25.94, + "end": 26.6, + "confidence": 0.377 + }, + { + "text": "smartphone", + "start": 26.6, + "end": 26.86, + "confidence": 0.977 + }, + { + "text": "ajoute", + "start": 26.86, + "end": 27.42, + "confidence": 0.813 + }, + { + "text": "le", + "start": 27.42, + "end": 27.64, + "confidence": 0.957 + }, + { + "text": "toucher,", + "start": 27.64, + "end": 28.06, + "confidence": 0.73 + }, + { + "text": "qui", + "start": 28.06, + "end": 28.18, + "confidence": 0.209 + }, + { + "text": "rend", + "start": 28.18, + "end": 28.34, + "confidence": 0.877 + }, + { + "text": "le", + "start": 28.34, + "end": 28.68, + "confidence": 0.991 + }, + { + "text": "contact", + "start": 28.68, + "end": 28.96, + "confidence": 0.854 + }, + { + "text": "plus", + "start": 28.96, + "end": 29.48, + "confidence": 0.865 + }, + { + "text": "direct,", + "start": 29.48, + "end": 29.96, + "confidence": 0.692 + }, + { + "text": "plus", + "start": 29.96, + "end": 30.24, + "confidence": 0.928 + }, + { + "text": "sensible.", + "start": 30.24, + "end": 30.56, + "confidence": 0.332 + } + ] + }, + { + "id": 10, + "seek": 2556, + "start": 31.04, + "end": 34.34, + "text": " Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner", + "tokens": [ + 3790, + 9093, + 11, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193 + ], + "temperature": 0.0, + "avg_logprob": 
-0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.827, + "words": [ + { + "text": "Et", + "start": 31.04, + "end": 31.24, + "confidence": 0.914 + }, + { + "text": "puis,", + "start": 31.24, + "end": 31.34, + "confidence": 0.713 + }, + { + "text": "évidemment,", + "start": 31.34, + "end": 31.64, + "confidence": 0.378 + }, + { + "text": "il", + "start": 31.64, + "end": 31.78, + "confidence": 0.935 + }, + { + "text": "faudrait", + "start": 31.78, + "end": 31.88, + "confidence": 0.99 + }, + { + "text": "parler", + "start": 31.88, + "end": 32.12, + "confidence": 0.882 + }, + { + "text": "aussi", + "start": 32.12, + "end": 32.3, + "confidence": 0.889 + }, + { + "text": "des", + "start": 32.3, + "end": 32.44, + "confidence": 0.927 + }, + { + "text": "applications", + "start": 32.44, + "end": 32.78, + "confidence": 0.839 + }, + { + "text": "qui", + "start": 32.78, + "end": 33.16, + "confidence": 0.652 + }, + { + "text": "permettent", + "start": 33.16, + "end": 33.68, + "confidence": 0.951 + }, + { + "text": "de", + "start": 33.68, + "end": 33.9, + "confidence": 0.952 + }, + { + "text": "contourner", + "start": 33.9, + "end": 34.34, + "confidence": 0.787 + } + ] + }, + { + "id": 11, + "seek": 2556, + "start": 34.34, + "end": 37.72, + "text": " le côté tout flu de la navigation web pour aller directement en but.", + "tokens": [ + 476, + 18437, + 3486, + 5029, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 465, + 457, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.766, + "words": [ + { + "text": "le", + "start": 34.34, + "end": 34.52, + "confidence": 0.989 + }, + { + "text": "côté", + "start": 34.52, + "end": 34.72, + "confidence": 0.983 + }, + { + "text": "tout", + "start": 34.72, + "end": 34.96, + "confidence": 0.954 + }, + { + "text": "flu", + "start": 34.96, + 
"end": 35.2, + "confidence": 0.548 + }, + { + "text": "de", + "start": 35.2, + "end": 35.42, + "confidence": 0.248 + }, + { + "text": "la", + "start": 35.42, + "end": 35.72, + "confidence": 0.902 + }, + { + "text": "navigation", + "start": 35.72, + "end": 36.04, + "confidence": 0.913 + }, + { + "text": "web", + "start": 36.04, + "end": 36.64, + "confidence": 0.93 + }, + { + "text": "pour", + "start": 36.64, + "end": 36.76, + "confidence": 0.746 + }, + { + "text": "aller", + "start": 36.76, + "end": 36.94, + "confidence": 0.992 + }, + { + "text": "directement", + "start": 36.94, + "end": 37.46, + "confidence": 0.986 + }, + { + "text": "en", + "start": 37.46, + "end": 37.68, + "confidence": 0.644 + }, + { + "text": "but.", + "start": 37.68, + "end": 37.72, + "confidence": 0.689 + } + ] + }, + { + "id": 12, + "seek": 2556, + "start": 37.72, + "end": 43.06, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas,", + "tokens": [ + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 5550, + 14964, + 11, + 465, + 38268, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.725, + "words": [ + { + "text": "Bref,", + "start": 37.72, + "end": 38.9, + "confidence": 0.967 + }, + { + "text": "tout", + "start": 38.9, + "end": 38.98, + "confidence": 0.786 + }, + { + "text": "ça,", + "start": 38.98, + "end": 39.36, + "confidence": 0.985 + }, + { + "text": "ce", + "start": 39.36, + "end": 39.68, + "confidence": 0.929 + }, + { + "text": "sont", + "start": 39.68, + "end": 39.84, + "confidence": 0.963 + }, + { + "text": "les", + "start": 39.84, + "end": 40.06, + "confidence": 0.976 + }, + { + "text": "conditions", + "start": 40.06, + "end": 40.54, + "confidence": 0.96 + }, + { + "text": "qui", + "start": 40.54, + "end": 40.9, + "confidence": 0.995 + }, + { + "text": 
"permettent", + "start": 40.9, + "end": 41.54, + "confidence": 0.986 + }, + { + "text": "de", + "start": 41.54, + "end": 41.58, + "confidence": 0.989 + }, + { + "text": "créer", + "start": 41.58, + "end": 41.92, + "confidence": 0.918 + }, + { + "text": "cette", + "start": 41.92, + "end": 42.3, + "confidence": 0.518 + }, + { + "text": "objet,", + "start": 42.3, + "end": 42.7, + "confidence": 0.213 + }, + { + "text": "en", + "start": 42.7, + "end": 42.8, + "confidence": 0.191 + }, + { + "text": "Nicolas,", + "start": 42.8, + "end": 43.06, + "confidence": 0.508 + } + ] + }, + { + "id": 13, + "seek": 2556, + "start": 43.1, + "end": 46.48, + "text": " dit qu'il est très fondablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 6176, + 421, + 6, + 388, + 871, + 5732, + 9557, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.768, + "words": [ + { + "text": "dit", + "start": 43.1, + "end": 43.52, + "confidence": 0.551 + }, + { + "text": "qu'il", + "start": 43.52, + "end": 43.68, + "confidence": 0.969 + }, + { + "text": "est", + "start": 43.68, + "end": 43.8, + "confidence": 0.851 + }, + { + "text": "très", + "start": 43.8, + "end": 43.94, + "confidence": 0.368 + }, + { + "text": "fondablement", + "start": 43.94, + "end": 44.68, + "confidence": 0.593 + }, + { + "text": "inédit", + "start": 44.68, + "end": 45.52, + "confidence": 0.66 + }, + { + "text": "dans", + "start": 45.52, + "end": 45.74, + "confidence": 0.778 + }, + { + "text": "l'histoire", + "start": 45.74, + "end": 45.98, + "confidence": 0.825 + }, + { + "text": "de", + "start": 45.98, + "end": 46.08, + "confidence": 0.978 + }, + { + "text": "l'humanité.", + "start": 46.08, + "end": 46.48, + "confidence": 0.991 + } + ] + }, + { + "id": 14, + "seek": 2556, + "start": 47.06, + "end": 
48.76, + "text": " Mais ça s'assoulait d'une autre interrogation.", + "tokens": [ + 6313, + 2788, + 262, + 6, + 640, + 263, + 35235, + 274, + 6, + 2613, + 15081, + 24871, + 399, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.697, + "words": [ + { + "text": "Mais", + "start": 47.06, + "end": 47.16, + "confidence": 0.939 + }, + { + "text": "ça", + "start": 47.16, + "end": 47.46, + "confidence": 0.854 + }, + { + "text": "s'assoulait", + "start": 47.46, + "end": 47.78, + "confidence": 0.591 + }, + { + "text": "d'une", + "start": 47.78, + "end": 48.02, + "confidence": 0.619 + }, + { + "text": "autre", + "start": 48.02, + "end": 48.14, + "confidence": 0.966 + }, + { + "text": "interrogation.", + "start": 48.14, + "end": 48.76, + "confidence": 0.833 + } + ] + }, + { + "id": 15, + "seek": 2556, + "start": 49.26, + "end": 54.34, + "text": " Est-ce que le fait que cette objet soit inédit un d'huies que notre rapport a lui est aussi", + "tokens": [ + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 5550, + 14964, + 12703, + 294, + 7811, + 270, + 517, + 274, + 6, + 12086, + 530, + 631, + 10349, + 18018, + 257, + 8783, + 871, + 6212 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.697, + "words": [ + { + "text": "Est-ce", + "start": 49.26, + "end": 49.7, + "confidence": 0.804 + }, + { + "text": "que", + "start": 49.7, + "end": 49.74, + "confidence": 0.989 + }, + { + "text": "le", + "start": 49.74, + "end": 49.78, + "confidence": 0.882 + }, + { + "text": "fait", + "start": 49.78, + "end": 49.96, + "confidence": 0.962 + }, + { + "text": "que", + "start": 49.96, + "end": 50.08, + "confidence": 0.935 + }, + { + "text": "cette", + "start": 50.08, + "end": 50.24, + "confidence": 0.95 + }, + { + "text": "objet", + "start": 50.24, + "end": 
50.5, + "confidence": 0.968 + }, + { + "text": "soit", + "start": 50.5, + "end": 50.96, + "confidence": 0.991 + }, + { + "text": "inédit", + "start": 50.96, + "end": 51.78, + "confidence": 0.91 + }, + { + "text": "un", + "start": 51.78, + "end": 52.06, + "confidence": 0.442 + }, + { + "text": "d'huies", + "start": 52.06, + "end": 52.32, + "confidence": 0.298 + }, + { + "text": "que", + "start": 52.32, + "end": 52.4, + "confidence": 0.966 + }, + { + "text": "notre", + "start": 52.4, + "end": 52.58, + "confidence": 0.992 + }, + { + "text": "rapport", + "start": 52.58, + "end": 53.1, + "confidence": 0.714 + }, + { + "text": "a", + "start": 53.1, + "end": 53.44, + "confidence": 0.522 + }, + { + "text": "lui", + "start": 53.44, + "end": 53.62, + "confidence": 0.659 + }, + { + "text": "est", + "start": 53.62, + "end": 54.0, + "confidence": 0.643 + }, + { + "text": "aussi", + "start": 54.0, + "end": 54.34, + "confidence": 0.808 + } + ] + }, + { + "id": 16, + "seek": 2556, + "start": 54.34, + "end": 55.32, + "text": " un rapport inédit?", + "tokens": [ + 517, + 18018, + 294, + 7811, + 270, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.849, + "words": [ + { + "text": "un", + "start": 54.34, + "end": 54.72, + "confidence": 0.506 + }, + { + "text": "rapport", + "start": 54.72, + "end": 54.94, + "confidence": 0.999 + }, + { + "text": "inédit?", + "start": 54.94, + "end": 55.32, + "confidence": 0.956 + } + ] + }, + { + "id": 17, + "seek": 5548, + "start": 55.6, + "end": 58.6, + "text": " Je veux dire, est-ce que le rapport qu'on a au sein de foi n'est comparable à celui", + "tokens": [ + 2588, + 16389, + 1264, + 11, + 871, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 6195, + 368, + 6901, + 297, + 6, + 377, + 6311, + 712, + 1531, + 22829 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 
1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.626, + "words": [ + { + "text": "Je", + "start": 55.6, + "end": 55.84, + "confidence": 0.335 + }, + { + "text": "veux", + "start": 55.84, + "end": 55.94, + "confidence": 0.432 + }, + { + "text": "dire,", + "start": 55.94, + "end": 56.16, + "confidence": 0.992 + }, + { + "text": "est-ce", + "start": 56.16, + "end": 56.34, + "confidence": 0.951 + }, + { + "text": "que", + "start": 56.34, + "end": 56.4, + "confidence": 0.973 + }, + { + "text": "le", + "start": 56.4, + "end": 56.54, + "confidence": 0.987 + }, + { + "text": "rapport", + "start": 56.54, + "end": 56.76, + "confidence": 0.999 + }, + { + "text": "qu'on", + "start": 56.76, + "end": 57.1, + "confidence": 0.906 + }, + { + "text": "a", + "start": 57.1, + "end": 57.14, + "confidence": 0.974 + }, + { + "text": "au", + "start": 57.14, + "end": 57.26, + "confidence": 0.319 + }, + { + "text": "sein", + "start": 57.26, + "end": 57.36, + "confidence": 0.244 + }, + { + "text": "de", + "start": 57.36, + "end": 57.44, + "confidence": 0.177 + }, + { + "text": "foi", + "start": 57.44, + "end": 57.54, + "confidence": 0.163 + }, + { + "text": "n'est", + "start": 57.54, + "end": 57.78, + "confidence": 0.777 + }, + { + "text": "comparable", + "start": 57.78, + "end": 58.32, + "confidence": 0.606 + }, + { + "text": "à", + "start": 58.32, + "end": 58.46, + "confidence": 0.482 + }, + { + "text": "celui", + "start": 58.46, + "end": 58.6, + "confidence": 0.831 + } + ] + }, + { + "id": 18, + "seek": 5548, + "start": 58.72, + "end": 62.81, + "text": " qu'on entretenait à d'autres objectes techniques comme la voiture ou le téléphone?", + "tokens": [ + 421, + 6, + 266, + 3962, + 1147, + 1001, + 1531, + 274, + 6, + 16752, + 2657, + 279, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + 
"confidence": 0.781, + "words": [ + { + "text": "qu'on", + "start": 58.72, + "end": 58.88, + "confidence": 0.941 + }, + { + "text": "entretenait", + "start": 58.88, + "end": 59.38, + "confidence": 0.657 + }, + { + "text": "à", + "start": 59.38, + "end": 59.44, + "confidence": 0.973 + }, + { + "text": "d'autres", + "start": 59.44, + "end": 59.64, + "confidence": 0.909 + }, + { + "text": "objectes", + "start": 59.64, + "end": 60.02, + "confidence": 0.528 + }, + { + "text": "techniques", + "start": 60.02, + "end": 60.38, + "confidence": 0.547 + }, + { + "text": "comme", + "start": 60.38, + "end": 60.86, + "confidence": 0.662 + }, + { + "text": "la", + "start": 60.86, + "end": 61.46, + "confidence": 0.898 + }, + { + "text": "voiture", + "start": 61.46, + "end": 61.8, + "confidence": 0.954 + }, + { + "text": "ou", + "start": 61.8, + "end": 62.32, + "confidence": 0.74 + }, + { + "text": "le", + "start": 62.32, + "end": 62.6, + "confidence": 0.847 + }, + { + "text": "téléphone?", + "start": 62.6, + "end": 62.81, + "confidence": 0.979 + } + ] + }, + { + "id": 19, + "seek": 5548, + "start": 62.81, + "end": 66.07, + "text": " Il n'y a pas d'équivalent.", + "tokens": [ + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.882, + "words": [ + { + "text": "Il", + "start": 62.81, + "end": 65.42, + "confidence": 0.866 + }, + { + "text": "n'y", + "start": 65.42, + "end": 65.52, + "confidence": 0.865 + }, + { + "text": "a", + "start": 65.52, + "end": 65.56, + "confidence": 0.965 + }, + { + "text": "pas", + "start": 65.56, + "end": 65.62, + "confidence": 0.998 + }, + { + "text": "d'équivalent.", + "start": 65.62, + "end": 66.07, + "confidence": 0.858 + } + ] + }, + { + "id": 20, + "seek": 5548, + "start": 66.07, + "end": 69.74, + "text": " On s'est espécie de nous voter dans la relation à 
l'objet.", + "tokens": [ + 1282, + 262, + 6, + 377, + 7089, + 526, + 4260, + 368, + 4666, + 21722, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.552, + "words": [ + { + "text": "On", + "start": 66.07, + "end": 67.0, + "confidence": 0.29 + }, + { + "text": "s'est", + "start": 67.0, + "end": 67.26, + "confidence": 0.562 + }, + { + "text": "espécie", + "start": 67.26, + "end": 67.46, + "confidence": 0.233 + }, + { + "text": "de", + "start": 67.46, + "end": 67.58, + "confidence": 0.963 + }, + { + "text": "nous", + "start": 67.58, + "end": 67.8, + "confidence": 0.631 + }, + { + "text": "voter", + "start": 67.8, + "end": 68.24, + "confidence": 0.241 + }, + { + "text": "dans", + "start": 68.24, + "end": 68.68, + "confidence": 0.853 + }, + { + "text": "la", + "start": 68.68, + "end": 68.88, + "confidence": 0.61 + }, + { + "text": "relation", + "start": 68.88, + "end": 69.22, + "confidence": 0.932 + }, + { + "text": "à", + "start": 69.22, + "end": 69.34, + "confidence": 0.792 + }, + { + "text": "l'objet.", + "start": 69.34, + "end": 69.74, + "confidence": 0.889 + } + ] + }, + { + "id": 21, + "seek": 5548, + "start": 70.18, + "end": 74.78, + "text": " C'est facilement éterréciant parce qu'on a impression de, comme le 10, les utilisateurs", + "tokens": [ + 383, + 6, + 377, + 23670, + 518, + 1136, + 391, + 10521, + 537, + 394, + 6992, + 421, + 6, + 266, + 257, + 9995, + 368, + 11, + 5173, + 476, + 1266, + 11, + 1512, + 33643, + 25929 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.491, + "words": [ + { + "text": "C'est", + "start": 70.18, + "end": 70.34, + "confidence": 0.907 + }, + { + "text": "facilement", + "start": 70.34, + "end": 70.72, + "confidence": 0.527 + }, + { + 
"text": "éterréciant", + "start": 70.72, + "end": 71.56, + "confidence": 0.277 + }, + { + "text": "parce", + "start": 71.56, + "end": 71.82, + "confidence": 0.298 + }, + { + "text": "qu'on", + "start": 71.82, + "end": 72.3, + "confidence": 0.775 + }, + { + "text": "a", + "start": 72.3, + "end": 72.4, + "confidence": 0.563 + }, + { + "text": "impression", + "start": 72.4, + "end": 72.74, + "confidence": 0.148 + }, + { + "text": "de,", + "start": 72.74, + "end": 73.36, + "confidence": 0.211 + }, + { + "text": "comme", + "start": 73.36, + "end": 73.8, + "confidence": 0.843 + }, + { + "text": "le", + "start": 73.8, + "end": 73.96, + "confidence": 0.9 + }, + { + "text": "10,", + "start": 73.96, + "end": 74.28, + "confidence": 0.395 + }, + { + "text": "les", + "start": 74.28, + "end": 74.32, + "confidence": 0.581 + }, + { + "text": "utilisateurs", + "start": 74.32, + "end": 74.78, + "confidence": 0.745 + } + ] + }, + { + "id": 22, + "seek": 5548, + "start": 74.8, + "end": 77.93, + "text": " et les efforts, elles aident dépendant de cette objet d'un lieu, en fait, une espèce de", + "tokens": [ + 1030, + 1512, + 6484, + 11, + 23576, + 257, + 1078, + 45768, + 394, + 368, + 5550, + 14964, + 274, + 6, + 409, + 26036, + 11, + 465, + 3887, + 11, + 2251, + 7089, + 30236, + 368 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.464, + "words": [ + { + "text": "et", + "start": 74.8, + "end": 74.92, + "confidence": 0.147 + }, + { + "text": "les", + "start": 74.92, + "end": 74.96, + "confidence": 0.242 + }, + { + "text": "efforts,", + "start": 74.96, + "end": 75.22, + "confidence": 0.108 + }, + { + "text": "elles", + "start": 75.22, + "end": 75.32, + "confidence": 0.108 + }, + { + "text": "aident", + "start": 75.32, + "end": 75.44, + "confidence": 0.289 + }, + { + "text": "dépendant", + "start": 75.44, + "end": 76.0, + "confidence": 0.576 + }, + { + "text": "de", + 
"start": 76.0, + "end": 76.16, + "confidence": 0.301 + }, + { + "text": "cette", + "start": 76.16, + "end": 76.2, + "confidence": 0.519 + }, + { + "text": "objet", + "start": 76.2, + "end": 76.48, + "confidence": 0.961 + }, + { + "text": "d'un", + "start": 76.48, + "end": 76.86, + "confidence": 0.883 + }, + { + "text": "lieu,", + "start": 76.86, + "end": 77.06, + "confidence": 0.333 + }, + { + "text": "en", + "start": 77.06, + "end": 77.18, + "confidence": 0.837 + }, + { + "text": "fait,", + "start": 77.18, + "end": 77.42, + "confidence": 0.958 + }, + { + "text": "une", + "start": 77.42, + "end": 77.46, + "confidence": 0.57 + }, + { + "text": "espèce", + "start": 77.46, + "end": 77.74, + "confidence": 0.961 + }, + { + "text": "de", + "start": 77.74, + "end": 77.93, + "confidence": 0.601 + } + ] + }, + { + "id": 23, + "seek": 5548, + "start": 77.93, + "end": 82.98, + "text": " relation de médiation avec le monde qui rendent un peu avec la même sédiforme de", + "tokens": [ + 9721, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 317, + 517, + 5604, + 4163, + 635, + 5698, + 262, + 7811, + 8629, + 68, + 368 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.556, + "words": [ + { + "text": "relation", + "start": 77.93, + "end": 78.32, + "confidence": 0.839 + }, + { + "text": "de", + "start": 78.32, + "end": 78.7, + "confidence": 0.723 + }, + { + "text": "médiation", + "start": 78.7, + "end": 79.4, + "confidence": 0.872 + }, + { + "text": "avec", + "start": 79.4, + "end": 79.74, + "confidence": 0.964 + }, + { + "text": "le", + "start": 79.74, + "end": 79.88, + "confidence": 0.985 + }, + { + "text": "monde", + "start": 79.88, + "end": 80.24, + "confidence": 0.909 + }, + { + "text": "qui", + "start": 80.24, + "end": 81.02, + "confidence": 0.871 + }, + { + "text": "rendent", + "start": 81.02, + "end": 81.74, + "confidence": 0.623 + }, + { + 
"text": "un", + "start": 81.74, + "end": 81.84, + "confidence": 0.224 + }, + { + "text": "peu", + "start": 81.84, + "end": 81.88, + "confidence": 0.223 + }, + { + "text": "avec", + "start": 81.88, + "end": 82.1, + "confidence": 0.863 + }, + { + "text": "la", + "start": 82.1, + "end": 82.24, + "confidence": 0.565 + }, + { + "text": "même", + "start": 82.24, + "end": 82.32, + "confidence": 0.384 + }, + { + "text": "sédiforme", + "start": 82.32, + "end": 82.86, + "confidence": 0.29 + }, + { + "text": "de", + "start": 82.86, + "end": 82.98, + "confidence": 0.899 + } + ] + }, + { + "id": 24, + "seek": 8298, + "start": 83.0, + "end": 87.66, + "text": " le jeu. Donc, à objets inédits, rapport inédits.", + "tokens": [ + 476, + 16748, + 13, + 7477, + 11, + 1531, + 1111, + 25349, + 294, + 7811, + 1208, + 11, + 18018, + 294, + 7811, + 1208, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.614, + "words": [ + { + "text": "le", + "start": 83.0, + "end": 83.12, + "confidence": 0.128 + }, + { + "text": "jeu.", + "start": 83.12, + "end": 83.64, + "confidence": 0.505 + }, + { + "text": "Donc,", + "start": 83.64, + "end": 84.48, + "confidence": 0.513 + }, + { + "text": "à", + "start": 84.48, + "end": 84.86, + "confidence": 0.634 + }, + { + "text": "objets", + "start": 84.86, + "end": 85.36, + "confidence": 0.547 + }, + { + "text": "inédits,", + "start": 85.36, + "end": 86.24, + "confidence": 0.73 + }, + { + "text": "rapport", + "start": 86.24, + "end": 86.62, + "confidence": 0.928 + }, + { + "text": "inédits.", + "start": 86.62, + "end": 87.66, + "confidence": 0.921 + } + ] + }, + { + "id": 25, + "seek": 8298, + "start": 88.08, + "end": 93.78, + "text": " Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépenses", + "tokens": [ + 3790, + 11, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 46750, + 38268, + 11, + 431, + 4212, + 
1032, + 578, + 4198, + 50027, + 971, + 517, + 41953, + 933, + 368, + 27998, + 9085 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.624, + "words": [ + { + "text": "Et,", + "start": 88.08, + "end": 88.3, + "confidence": 0.87 + }, + { + "text": "ce", + "start": 88.3, + "end": 88.8, + "confidence": 0.462 + }, + { + "text": "rapport,", + "start": 88.8, + "end": 89.28, + "confidence": 0.997 + }, + { + "text": "si", + "start": 89.28, + "end": 89.56, + "confidence": 0.913 + }, + { + "text": "j'en", + "start": 89.56, + "end": 89.74, + "confidence": 0.771 + }, + { + "text": "prends", + "start": 89.74, + "end": 89.84, + "confidence": 0.313 + }, + { + "text": "Nicolas,", + "start": 89.84, + "end": 90.54, + "confidence": 0.358 + }, + { + "text": "frère", + "start": 90.54, + "end": 91.06, + "confidence": 0.405 + }, + { + "text": "caractérisée", + "start": 91.06, + "end": 91.7, + "confidence": 0.567 + }, + { + "text": "par", + "start": 91.7, + "end": 92.12, + "confidence": 0.868 + }, + { + "text": "un", + "start": 92.12, + "end": 92.32, + "confidence": 0.989 + }, + { + "text": "mélange", + "start": 92.32, + "end": 92.96, + "confidence": 0.932 + }, + { + "text": "de", + "start": 92.96, + "end": 93.24, + "confidence": 0.812 + }, + { + "text": "dépenses", + "start": 93.24, + "end": 93.78, + "confidence": 0.404 + } + ] + }, + { + "id": 26, + "seek": 8298, + "start": 94.36, + "end": 94.98, + "text": " et de rojets.", + "tokens": [ + 1030, + 368, + 744, + 73, + 1385, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.583, + "words": [ + { + "text": "et", + "start": 94.36, + "end": 94.52, + "confidence": 0.986 + }, + { + "text": "de", + "start": 94.52, + "end": 94.56, + "confidence": 0.996 + }, + { + "text": "rojets.", + "start": 94.56, + "end": 
94.98, + "confidence": 0.41 + } + ] + }, + { + "id": 27, + "seek": 8298, + "start": 95.8, + "end": 100.4, + "text": " Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objectes", + "tokens": [ + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 5732, + 962, + 1712, + 14953, + 287, + 6, + 29093, + 730, + 2657, + 279 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.749, + "words": [ + { + "text": "Bon,", + "start": 95.8, + "end": 96.06, + "confidence": 0.71 + }, + { + "text": "en", + "start": 96.06, + "end": 96.54, + "confidence": 0.92 + }, + { + "text": "vrai,", + "start": 96.54, + "end": 96.88, + "confidence": 0.994 + }, + { + "text": "il", + "start": 96.88, + "end": 97.1, + "confidence": 0.985 + }, + { + "text": "faudrait", + "start": 97.1, + "end": 97.5, + "confidence": 0.932 + }, + { + "text": "remonter", + "start": 97.5, + "end": 98.02, + "confidence": 0.574 + }, + { + "text": "très", + "start": 98.02, + "end": 98.46, + "confidence": 0.984 + }, + { + "text": "très", + "start": 98.46, + "end": 98.76, + "confidence": 0.597 + }, + { + "text": "finement", + "start": 98.76, + "end": 99.36, + "confidence": 0.476 + }, + { + "text": "toute", + "start": 99.36, + "end": 99.68, + "confidence": 0.367 + }, + { + "text": "l'histoire", + "start": 99.68, + "end": 100.02, + "confidence": 0.909 + }, + { + "text": "des", + "start": 100.02, + "end": 100.2, + "confidence": 0.949 + }, + { + "text": "objectes", + "start": 100.2, + "end": 100.4, + "confidence": 0.805 + } + ] + }, + { + "id": 28, + "seek": 8298, + "start": 100.4, + "end": 105.14, + "text": " techniques et de leur infération dans le vie pour déterminer si ce rapport est totalement", + "tokens": [ + 7512, + 1030, + 368, + 9580, + 1536, + 526, + 2405, + 2680, + 476, + 4941, + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203 
+ ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.665, + "words": [ + { + "text": "techniques", + "start": 100.4, + "end": 101.02, + "confidence": 0.954 + }, + { + "text": "et", + "start": 101.02, + "end": 101.52, + "confidence": 0.967 + }, + { + "text": "de", + "start": 101.52, + "end": 101.64, + "confidence": 0.973 + }, + { + "text": "leur", + "start": 101.64, + "end": 101.78, + "confidence": 0.811 + }, + { + "text": "infération", + "start": 101.78, + "end": 102.22, + "confidence": 0.227 + }, + { + "text": "dans", + "start": 102.22, + "end": 102.46, + "confidence": 0.518 + }, + { + "text": "le", + "start": 102.46, + "end": 102.54, + "confidence": 0.511 + }, + { + "text": "vie", + "start": 102.54, + "end": 102.78, + "confidence": 0.612 + }, + { + "text": "pour", + "start": 102.78, + "end": 103.06, + "confidence": 0.933 + }, + { + "text": "déterminer", + "start": 103.06, + "end": 103.64, + "confidence": 0.954 + }, + { + "text": "si", + "start": 103.64, + "end": 103.74, + "confidence": 0.488 + }, + { + "text": "ce", + "start": 103.74, + "end": 103.86, + "confidence": 0.98 + }, + { + "text": "rapport", + "start": 103.86, + "end": 104.1, + "confidence": 0.997 + }, + { + "text": "est", + "start": 104.1, + "end": 104.88, + "confidence": 0.942 + }, + { + "text": "totalement", + "start": 104.88, + "end": 105.14, + "confidence": 0.854 + } + ] + }, + { + "id": 29, + "seek": 8298, + "start": 105.26, + "end": 105.78, + "text": " inédit.", + "tokens": [ + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.943, + "words": [ + { + "text": "inédit.", + "start": 105.26, + "end": 105.78, + "confidence": 0.943 + } + ] + }, + { + "id": 30, + "seek": 8298, + "start": 106.14, + "end": 109.36, + "text": " Mais j'ai l'impression 
comme ça que Nicolas se trompe pas vraiment.", + "tokens": [ + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.798, + "words": [ + { + "text": "Mais", + "start": 106.14, + "end": 106.34, + "confidence": 0.872 + }, + { + "text": "j'ai", + "start": 106.34, + "end": 106.9, + "confidence": 0.924 + }, + { + "text": "l'impression", + "start": 106.9, + "end": 107.28, + "confidence": 0.967 + }, + { + "text": "comme", + "start": 107.28, + "end": 107.5, + "confidence": 0.709 + }, + { + "text": "ça", + "start": 107.5, + "end": 107.68, + "confidence": 0.955 + }, + { + "text": "que", + "start": 107.68, + "end": 107.96, + "confidence": 0.91 + }, + { + "text": "Nicolas", + "start": 107.96, + "end": 108.36, + "confidence": 0.986 + }, + { + "text": "se", + "start": 108.36, + "end": 108.66, + "confidence": 0.569 + }, + { + "text": "trompe", + "start": 108.66, + "end": 109.0, + "confidence": 0.532 + }, + { + "text": "pas", + "start": 109.0, + "end": 109.1, + "confidence": 0.715 + }, + { + "text": "vraiment.", + "start": 109.1, + "end": 109.36, + "confidence": 0.923 + } + ] + }, + { + "id": 31, + "seek": 10970, + "start": 109.72, + "end": 114.26, + "text": " Pour autant, je sache. 
Il y a eu plein de discussions autour de la voiture ou même", + "tokens": [ + 8732, + 34081, + 11, + 1506, + 262, + 6000, + 13, + 4416, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.829, + "words": [ + { + "text": "Pour", + "start": 109.72, + "end": 110.08, + "confidence": 0.92 + }, + { + "text": "autant,", + "start": 110.08, + "end": 110.36, + "confidence": 0.986 + }, + { + "text": "je", + "start": 110.36, + "end": 110.4, + "confidence": 0.894 + }, + { + "text": "sache.", + "start": 110.4, + "end": 110.86, + "confidence": 0.531 + }, + { + "text": "Il", + "start": 110.86, + "end": 111.16, + "confidence": 0.851 + }, + { + "text": "y", + "start": 111.16, + "end": 111.22, + "confidence": 0.872 + }, + { + "text": "a", + "start": 111.22, + "end": 111.28, + "confidence": 0.939 + }, + { + "text": "eu", + "start": 111.28, + "end": 111.38, + "confidence": 0.891 + }, + { + "text": "plein", + "start": 111.38, + "end": 111.76, + "confidence": 0.833 + }, + { + "text": "de", + "start": 111.76, + "end": 112.04, + "confidence": 0.94 + }, + { + "text": "discussions", + "start": 112.04, + "end": 112.46, + "confidence": 0.711 + }, + { + "text": "autour", + "start": 112.46, + "end": 112.96, + "confidence": 0.97 + }, + { + "text": "de", + "start": 112.96, + "end": 113.46, + "confidence": 0.952 + }, + { + "text": "la", + "start": 113.46, + "end": 113.5, + "confidence": 0.955 + }, + { + "text": "voiture", + "start": 113.5, + "end": 113.8, + "confidence": 0.983 + }, + { + "text": "ou", + "start": 113.8, + "end": 114.02, + "confidence": 0.523 + }, + { + "text": "même", + "start": 114.02, + "end": 114.26, + "confidence": 0.963 + } + ] + }, + { + "id": 32, + "seek": 10970, + "start": 114.42, + "end": 118.76, + "text": " du téléphone. 
Mais la dépense n'était pas du même mort, donc le rejet n'en", + "tokens": [ + 1581, + 47159, + 13, + 6313, + 635, + 27998, + 1288, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 6599, + 11, + 5926, + 476, + 319, + 7108, + 297, + 6, + 268 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.732, + "words": [ + { + "text": "du", + "start": 114.42, + "end": 114.6, + "confidence": 0.677 + }, + { + "text": "téléphone.", + "start": 114.6, + "end": 115.16, + "confidence": 0.983 + }, + { + "text": "Mais", + "start": 115.16, + "end": 115.72, + "confidence": 0.649 + }, + { + "text": "la", + "start": 115.72, + "end": 116.0, + "confidence": 0.809 + }, + { + "text": "dépense", + "start": 116.0, + "end": 116.38, + "confidence": 0.766 + }, + { + "text": "n'était", + "start": 116.38, + "end": 116.62, + "confidence": 0.952 + }, + { + "text": "pas", + "start": 116.62, + "end": 117.02, + "confidence": 0.994 + }, + { + "text": "du", + "start": 117.02, + "end": 117.16, + "confidence": 0.98 + }, + { + "text": "même", + "start": 117.16, + "end": 117.32, + "confidence": 0.944 + }, + { + "text": "mort,", + "start": 117.32, + "end": 117.66, + "confidence": 0.519 + }, + { + "text": "donc", + "start": 117.66, + "end": 117.78, + "confidence": 0.871 + }, + { + "text": "le", + "start": 117.78, + "end": 118.32, + "confidence": 0.932 + }, + { + "text": "rejet", + "start": 118.32, + "end": 118.62, + "confidence": 0.524 + }, + { + "text": "n'en", + "start": 118.62, + "end": 118.76, + "confidence": 0.472 + } + ] + }, + { + "id": 33, + "seek": 10970, + "start": 118.76, + "end": 119.66, + "text": " plus n'était pas du même mort.", + "tokens": [ + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 6599, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.853, + "words": 
[ + { + "text": "plus", + "start": 118.76, + "end": 118.9, + "confidence": 0.313 + }, + { + "text": "n'était", + "start": 118.9, + "end": 119.1, + "confidence": 0.973 + }, + { + "text": "pas", + "start": 119.1, + "end": 119.26, + "confidence": 0.998 + }, + { + "text": "du", + "start": 119.26, + "end": 119.36, + "confidence": 0.988 + }, + { + "text": "même", + "start": 119.36, + "end": 119.5, + "confidence": 0.999 + }, + { + "text": "mort.", + "start": 119.5, + "end": 119.66, + "confidence": 0.984 + } + ] + }, + { + "id": 34, + "seek": 10970, + "start": 120.06, + "end": 122.94, + "text": " On peut adorer sa bagnure, en avoir besoin pour plein de choses.", + "tokens": [ + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 77, + 540, + 11, + 465, + 10853, + 19207, + 2016, + 21088, + 368, + 14488, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.753, + "words": [ + { + "text": "On", + "start": 120.06, + "end": 120.22, + "confidence": 0.969 + }, + { + "text": "peut", + "start": 120.22, + "end": 120.32, + "confidence": 0.988 + }, + { + "text": "adorer", + "start": 120.32, + "end": 120.64, + "confidence": 0.854 + }, + { + "text": "sa", + "start": 120.64, + "end": 120.86, + "confidence": 0.918 + }, + { + "text": "bagnure,", + "start": 120.86, + "end": 121.38, + "confidence": 0.368 + }, + { + "text": "en", + "start": 121.38, + "end": 121.52, + "confidence": 0.56 + }, + { + "text": "avoir", + "start": 121.52, + "end": 121.66, + "confidence": 0.969 + }, + { + "text": "besoin", + "start": 121.66, + "end": 122.08, + "confidence": 0.997 + }, + { + "text": "pour", + "start": 122.08, + "end": 122.34, + "confidence": 0.92 + }, + { + "text": "plein", + "start": 122.34, + "end": 122.64, + "confidence": 0.9 + }, + { + "text": "de", + "start": 122.64, + "end": 122.78, + "confidence": 0.993 + }, + { + "text": "choses.", + "start": 122.78, + "end": 122.94, + 
"confidence": 0.994 + } + ] + }, + { + "id": 35, + "seek": 10970, + "start": 123.36, + "end": 126.38, + "text": " Et là, le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 3790, + 3684, + 11, + 476, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.826, + "words": [ + { + "text": "Et", + "start": 123.36, + "end": 123.48, + "confidence": 0.557 + }, + { + "text": "là,", + "start": 123.48, + "end": 123.66, + "confidence": 0.527 + }, + { + "text": "le", + "start": 123.66, + "end": 124.02, + "confidence": 0.986 + }, + { + "text": "soir,", + "start": 124.02, + "end": 124.5, + "confidence": 0.966 + }, + { + "text": "quand", + "start": 124.5, + "end": 124.9, + "confidence": 0.774 + }, + { + "text": "on", + "start": 124.9, + "end": 125.02, + "confidence": 0.986 + }, + { + "text": "va", + "start": 125.02, + "end": 125.1, + "confidence": 0.968 + }, + { + "text": "se", + "start": 125.1, + "end": 125.2, + "confidence": 0.862 + }, + { + "text": "coucher,", + "start": 125.2, + "end": 125.64, + "confidence": 0.791 + }, + { + "text": "on", + "start": 125.64, + "end": 126.04, + "confidence": 0.974 + }, + { + "text": "la", + "start": 126.04, + "end": 126.12, + "confidence": 0.783 + }, + { + "text": "laisse.", + "start": 126.12, + "end": 126.38, + "confidence": 0.981 + } + ] + }, + { + "id": 36, + "seek": 10970, + "start": 127.06, + "end": 130.0, + "text": " On l'a pas dans la main, quand on est collis, quand on n'en mène pas au chiot.", + "tokens": [ + 1282, + 287, + 6, + 64, + 1736, + 2680, + 635, + 2135, + 11, + 6932, + 322, + 871, + 1263, + 271, + 11, + 6932, + 322, + 297, + 6, + 268, + 275, + 18832, + 1736, + 1609, + 417, + 6471, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + 
"no_speech_prob": 9.048193533089943e-06, + "confidence": 0.66, + "words": [ + { + "text": "On", + "start": 127.06, + "end": 127.3, + "confidence": 0.742 + }, + { + "text": "l'a", + "start": 127.3, + "end": 127.46, + "confidence": 0.714 + }, + { + "text": "pas", + "start": 127.46, + "end": 127.64, + "confidence": 0.99 + }, + { + "text": "dans", + "start": 127.64, + "end": 127.82, + "confidence": 0.967 + }, + { + "text": "la", + "start": 127.82, + "end": 127.94, + "confidence": 0.956 + }, + { + "text": "main,", + "start": 127.94, + "end": 128.3, + "confidence": 0.978 + }, + { + "text": "quand", + "start": 128.3, + "end": 128.44, + "confidence": 0.967 + }, + { + "text": "on", + "start": 128.44, + "end": 128.6, + "confidence": 0.993 + }, + { + "text": "est", + "start": 128.6, + "end": 128.66, + "confidence": 0.602 + }, + { + "text": "collis,", + "start": 128.66, + "end": 129.2, + "confidence": 0.346 + }, + { + "text": "quand", + "start": 129.2, + "end": 129.24, + "confidence": 0.524 + }, + { + "text": "on", + "start": 129.24, + "end": 129.32, + "confidence": 0.991 + }, + { + "text": "n'en", + "start": 129.32, + "end": 129.38, + "confidence": 0.537 + }, + { + "text": "mène", + "start": 129.38, + "end": 129.56, + "confidence": 0.434 + }, + { + "text": "pas", + "start": 129.56, + "end": 129.72, + "confidence": 0.998 + }, + { + "text": "au", + "start": 129.72, + "end": 129.82, + "confidence": 0.811 + }, + { + "text": "chiot.", + "start": 129.82, + "end": 130.0, + "confidence": 0.473 + } + ] + }, + { + "id": 37, + "seek": 10970, + "start": 130.88, + "end": 135.1, + "text": " On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une", + "tokens": [ + 1282, + 45913, + 7418, + 1136, + 936, + 15797, + 971, + 1872, + 275, + 423, + 1956, + 2678, + 84, + 494, + 1001, + 635, + 34207, + 368, + 47159, + 17338, + 2251 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 
9.048193533089943e-06, + "confidence": 0.672, + "words": [ + { + "text": "On", + "start": 130.88, + "end": 131.0, + "confidence": 0.991 + }, + { + "text": "pouvait", + "start": 131.0, + "end": 131.24, + "confidence": 0.532 + }, + { + "text": "être", + "start": 131.24, + "end": 131.7, + "confidence": 0.545 + }, + { + "text": "émervé", + "start": 131.7, + "end": 132.2, + "confidence": 0.725 + }, + { + "text": "par", + "start": 132.2, + "end": 132.42, + "confidence": 0.82 + }, + { + "text": "son", + "start": 132.42, + "end": 132.68, + "confidence": 0.448 + }, + { + "text": "mome", + "start": 132.68, + "end": 133.04, + "confidence": 0.261 + }, + { + "text": "qui", + "start": 133.04, + "end": 133.26, + "confidence": 0.901 + }, + { + "text": "occupeait", + "start": 133.26, + "end": 133.72, + "confidence": 0.641 + }, + { + "text": "la", + "start": 133.72, + "end": 133.8, + "confidence": 0.8 + }, + { + "text": "ligne", + "start": 133.8, + "end": 134.0, + "confidence": 0.976 + }, + { + "text": "de", + "start": 134.0, + "end": 134.14, + "confidence": 0.964 + }, + { + "text": "téléphone", + "start": 134.14, + "end": 134.44, + "confidence": 0.977 + }, + { + "text": "pendant", + "start": 134.44, + "end": 134.8, + "confidence": 0.92 + }, + { + "text": "une", + "start": 134.8, + "end": 135.1, + "confidence": 0.838 + } + ] + }, + { + "id": 38, + "seek": 10970, + "start": 135.1, + "end": 136.84, + "text": " heure chaque soir pour discuter avec un copain.", + "tokens": [ + 30027, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.922, + "words": [ + { + "text": "heure", + "start": 135.1, + "end": 135.36, + "confidence": 0.701 + }, + { + "text": "chaque", + "start": 135.36, + "end": 135.52, + "confidence": 0.957 + }, + { + "text": "soir", + "start": 135.52, + "end": 135.76, + "confidence": 
0.997 + }, + { + "text": "pour", + "start": 135.76, + "end": 135.94, + "confidence": 0.983 + }, + { + "text": "discuter", + "start": 135.94, + "end": 136.26, + "confidence": 0.882 + }, + { + "text": "avec", + "start": 136.26, + "end": 136.44, + "confidence": 0.993 + }, + { + "text": "un", + "start": 136.44, + "end": 136.6, + "confidence": 0.976 + }, + { + "text": "copain.", + "start": 136.6, + "end": 136.84, + "confidence": 0.948 + } + ] + }, + { + "id": 39, + "seek": 13702, + "start": 137.26, + "end": 141.8, + "text": " Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui", + "tokens": [ + 6313, + 2788, + 408, + 725, + 37227, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 5698, + 275, + 423, + 14023, + 6, + 10556 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.716, + "words": [ + { + "text": "Mais", + "start": 137.26, + "end": 137.52, + "confidence": 0.967 + }, + { + "text": "ça", + "start": 137.52, + "end": 137.6, + "confidence": 0.859 + }, + { + "text": "ne", + "start": 137.6, + "end": 137.68, + "confidence": 0.681 + }, + { + "text": "ressemble", + "start": 137.68, + "end": 138.14, + "confidence": 0.743 + }, + { + "text": "pas", + "start": 138.14, + "end": 138.66, + "confidence": 0.524 + }, + { + "text": "à", + "start": 138.66, + "end": 138.94, + "confidence": 0.978 + }, + { + "text": "ce", + "start": 138.94, + "end": 139.02, + "confidence": 0.605 + }, + { + "text": "qu'on", + "start": 139.02, + "end": 139.16, + "confidence": 0.961 + }, + { + "text": "peut", + "start": 139.16, + "end": 139.3, + "confidence": 0.586 + }, + { + "text": "ressentir", + "start": 139.3, + "end": 140.04, + "confidence": 0.898 + }, + { + "text": "à", + "start": 140.04, + "end": 140.24, + "confidence": 0.352 + }, + { + "text": "voir", + "start": 140.24, + "end": 140.48, + "confidence": 0.918 + }, 
+ { + "text": "même", + "start": 140.48, + "end": 140.86, + "confidence": 0.324 + }, + { + "text": "mome", + "start": 140.86, + "end": 141.18, + "confidence": 0.374 + }, + { + "text": "aujourd'hui", + "start": 141.18, + "end": 141.8, + "confidence": 0.949 + } + ] + }, + { + "id": 40, + "seek": 13702, + "start": 141.92, + "end": 145.76, + "text": " continuuellement avec son smartphone dans la main, comme c'était une sorte de estimateur", + "tokens": [ + 2993, + 31816, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 5173, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 8017, + 15540 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.584, + "words": [ + { + "text": "continuuellement", + "start": 141.92, + "end": 142.8, + "confidence": 0.327 + }, + { + "text": "avec", + "start": 142.8, + "end": 143.18, + "confidence": 0.903 + }, + { + "text": "son", + "start": 143.18, + "end": 143.36, + "confidence": 0.866 + }, + { + "text": "smartphone", + "start": 143.36, + "end": 143.64, + "confidence": 0.467 + }, + { + "text": "dans", + "start": 143.64, + "end": 143.92, + "confidence": 0.554 + }, + { + "text": "la", + "start": 143.92, + "end": 144.0, + "confidence": 0.972 + }, + { + "text": "main,", + "start": 144.0, + "end": 144.26, + "confidence": 0.997 + }, + { + "text": "comme", + "start": 144.26, + "end": 144.52, + "confidence": 0.95 + }, + { + "text": "c'était", + "start": 144.52, + "end": 144.78, + "confidence": 0.574 + }, + { + "text": "une", + "start": 144.78, + "end": 144.94, + "confidence": 0.971 + }, + { + "text": "sorte", + "start": 144.94, + "end": 145.1, + "confidence": 0.642 + }, + { + "text": "de", + "start": 145.1, + "end": 145.18, + "confidence": 0.268 + }, + { + "text": "estimateur", + "start": 145.18, + "end": 145.76, + "confidence": 0.415 + } + ] + }, + { + "id": 41, + "seek": 13702, + "start": 145.94, + "end": 148.88, + "text": " extère 
de l'intempis de lâcher à l'éantrénée, ça m'a eu immédiate.", + "tokens": [ + 1279, + 4212, + 368, + 287, + 6, + 686, + 15970, + 271, + 368, + 48835, + 6759, + 1531, + 287, + 6, + 526, + 394, + 81, + 3516, + 3856, + 11, + 2788, + 275, + 6, + 64, + 2228, + 3397, + 526, + 4504, + 473, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.401, + "words": [ + { + "text": "extère", + "start": 145.94, + "end": 146.38, + "confidence": 0.357 + }, + { + "text": "de", + "start": 146.38, + "end": 146.46, + "confidence": 0.253 + }, + { + "text": "l'intempis", + "start": 146.46, + "end": 146.7, + "confidence": 0.153 + }, + { + "text": "de", + "start": 146.7, + "end": 146.9, + "confidence": 0.858 + }, + { + "text": "lâcher", + "start": 146.9, + "end": 147.32, + "confidence": 0.824 + }, + { + "text": "à", + "start": 147.32, + "end": 147.44, + "confidence": 0.494 + }, + { + "text": "l'éantrénée,", + "start": 147.44, + "end": 147.94, + "confidence": 0.476 + }, + { + "text": "ça", + "start": 147.94, + "end": 148.0, + "confidence": 0.772 + }, + { + "text": "m'a", + "start": 148.0, + "end": 148.26, + "confidence": 0.532 + }, + { + "text": "eu", + "start": 148.26, + "end": 148.42, + "confidence": 0.181 + }, + { + "text": "immédiate.", + "start": 148.42, + "end": 148.88, + "confidence": 0.537 + } + ] + }, + { + "id": 42, + "seek": 13702, + "start": 149.08, + "end": 152.02, + "text": " Bon, je dis ça pour le mome, mais évidemment, va là pour nos aussi.", + "tokens": [ + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 423, + 11, + 2420, + 24724, + 11, + 2773, + 3684, + 2016, + 3269, + 6212, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.529, + "words": [ + { + "text": "Bon,", + "start": 149.08, + "end": 149.3, + "confidence": 0.285 + 
}, + { + "text": "je", + "start": 149.3, + "end": 149.34, + "confidence": 0.425 + }, + { + "text": "dis", + "start": 149.34, + "end": 149.42, + "confidence": 0.316 + }, + { + "text": "ça", + "start": 149.42, + "end": 149.62, + "confidence": 0.953 + }, + { + "text": "pour", + "start": 149.62, + "end": 149.72, + "confidence": 0.971 + }, + { + "text": "le", + "start": 149.72, + "end": 149.82, + "confidence": 0.993 + }, + { + "text": "mome,", + "start": 149.82, + "end": 150.24, + "confidence": 0.575 + }, + { + "text": "mais", + "start": 150.24, + "end": 150.44, + "confidence": 0.713 + }, + { + "text": "évidemment,", + "start": 150.44, + "end": 151.1, + "confidence": 0.775 + }, + { + "text": "va", + "start": 151.1, + "end": 151.28, + "confidence": 0.381 + }, + { + "text": "là", + "start": 151.28, + "end": 151.42, + "confidence": 0.633 + }, + { + "text": "pour", + "start": 151.42, + "end": 151.62, + "confidence": 0.398 + }, + { + "text": "nos", + "start": 151.62, + "end": 151.7, + "confidence": 0.807 + }, + { + "text": "aussi.", + "start": 151.7, + "end": 152.02, + "confidence": 0.145 + } + ] + }, + { + "id": 43, + "seek": 13702, + "start": 152.66, + "end": 154.4, + "text": " Donc, rapport immédiate d'accord.", + "tokens": [ + 7477, + 11, + 18018, + 3397, + 526, + 4504, + 473, + 274, + 6, + 19947, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.851, + "words": [ + { + "text": "Donc,", + "start": 152.66, + "end": 153.0, + "confidence": 0.985 + }, + { + "text": "rapport", + "start": 153.0, + "end": 153.42, + "confidence": 0.977 + }, + { + "text": "immédiate", + "start": 153.42, + "end": 154.26, + "confidence": 0.825 + }, + { + "text": "d'accord.", + "start": 154.26, + "end": 154.4, + "confidence": 0.806 + } + ] + }, + { + "id": 44, + "seek": 13702, + "start": 154.4, + "end": 157.95, + "text": " Mais pourquoi, à ton impression qu'on en sortira 
jamais?", + "tokens": [ + 6313, + 19934, + 11, + 1531, + 2952, + 9995, + 421, + 6, + 266, + 465, + 26906, + 64, + 14540, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.791, + "words": [ + { + "text": "Mais", + "start": 154.4, + "end": 155.9, + "confidence": 0.984 + }, + { + "text": "pourquoi,", + "start": 155.9, + "end": 156.36, + "confidence": 0.959 + }, + { + "text": "à", + "start": 156.36, + "end": 156.48, + "confidence": 0.821 + }, + { + "text": "ton", + "start": 156.48, + "end": 156.66, + "confidence": 0.952 + }, + { + "text": "impression", + "start": 156.66, + "end": 156.96, + "confidence": 0.932 + }, + { + "text": "qu'on", + "start": 156.96, + "end": 157.28, + "confidence": 0.906 + }, + { + "text": "en", + "start": 157.28, + "end": 157.34, + "confidence": 0.789 + }, + { + "text": "sortira", + "start": 157.34, + "end": 157.84, + "confidence": 0.543 + }, + { + "text": "jamais?", + "start": 157.84, + "end": 157.95, + "confidence": 0.503 + } + ] + }, + { + "id": 45, + "seek": 13702, + "start": 157.95, + "end": 162.37, + "text": " Et puis, il faut en remettre la faute sur les gens qui ont créé cette", + "tokens": [ + 3790, + 9093, + 11, + 1930, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 5550 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.82, + "words": [ + { + "text": "Et", + "start": 157.95, + "end": 159.26, + "confidence": 0.838 + }, + { + "text": "puis,", + "start": 159.26, + "end": 159.58, + "confidence": 0.481 + }, + { + "text": "il", + "start": 159.58, + "end": 159.62, + "confidence": 0.665 + }, + { + "text": "faut", + "start": 159.62, + "end": 159.66, + "confidence": 0.942 + }, + { + "text": "en", + "start": 159.66, + "end": 159.72, + 
"confidence": 0.925 + }, + { + "text": "remettre", + "start": 159.72, + "end": 160.1, + "confidence": 0.985 + }, + { + "text": "la", + "start": 160.1, + "end": 160.28, + "confidence": 0.702 + }, + { + "text": "faute", + "start": 160.28, + "end": 160.62, + "confidence": 0.55 + }, + { + "text": "sur", + "start": 160.62, + "end": 160.9, + "confidence": 0.954 + }, + { + "text": "les", + "start": 160.9, + "end": 161.22, + "confidence": 0.81 + }, + { + "text": "gens", + "start": 161.22, + "end": 161.42, + "confidence": 0.985 + }, + { + "text": "qui", + "start": 161.42, + "end": 161.58, + "confidence": 0.981 + }, + { + "text": "ont", + "start": 161.58, + "end": 161.62, + "confidence": 0.955 + }, + { + "text": "créé", + "start": 161.62, + "end": 162.3, + "confidence": 0.957 + }, + { + "text": "cette", + "start": 162.3, + "end": 162.37, + "confidence": 0.9 + } + ] + }, + { + "id": 46, + "seek": 16228, + "start": 162.37, + "end": 165.3, + "text": " route merveilleux et diabolique, qui a dit à bollique par coeur, merveilleux.", + "tokens": [ + 7955, + 3551, + 303, + 3409, + 2449, + 1030, + 33227, + 401, + 1925, + 11, + 1956, + 257, + 6176, + 1531, + 748, + 285, + 1925, + 971, + 45781, + 11, + 3551, + 303, + 3409, + 2449, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7643054464588994, + "compression_ratio": 1.544041450777202, + "no_speech_prob": 3.89045562769752e-05, + "confidence": 0.397, + "words": [ + { + "text": "route", + "start": 162.37, + "end": 162.6, + "confidence": 0.076 + }, + { + "text": "merveilleux", + "start": 162.6, + "end": 163.3, + "confidence": 0.635 + }, + { + "text": "et", + "start": 163.3, + "end": 163.42, + "confidence": 0.837 + }, + { + "text": "diabolique,", + "start": 163.42, + "end": 163.82, + "confidence": 0.328 + }, + { + "text": "qui", + "start": 163.82, + "end": 163.9, + "confidence": 0.365 + }, + { + "text": "a", + "start": 163.9, + "end": 163.98, + "confidence": 0.054 + }, + { + "text": "dit", + "start": 163.98, + "end": 164.06, + 
"confidence": 0.085 + }, + { + "text": "à", + "start": 164.06, + "end": 164.1, + "confidence": 0.433 + }, + { + "text": "bollique", + "start": 164.1, + "end": 164.3, + "confidence": 0.297 + }, + { + "text": "par", + "start": 164.3, + "end": 164.52, + "confidence": 0.634 + }, + { + "text": "coeur,", + "start": 164.52, + "end": 164.78, + "confidence": 0.361 + }, + { + "text": "merveilleux.", + "start": 164.78, + "end": 165.3, + "confidence": 0.982 + } + ] + }, + { + "id": 47, + "seek": 16228, + "start": 167.36, + "end": 168.7, + "text": " Les économistes parlent de dépendance du santé.", + "tokens": [ + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 30068, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7643054464588994, + "compression_ratio": 1.544041450777202, + "no_speech_prob": 3.89045562769752e-05, + "confidence": 0.748, + "words": [ + { + "text": "Les", + "start": 167.36, + "end": 167.4, + "confidence": 0.513 + }, + { + "text": "économistes", + "start": 167.4, + "end": 167.5, + "confidence": 0.937 + }, + { + "text": "parlent", + "start": 167.5, + "end": 167.78, + "confidence": 0.806 + }, + { + "text": "de", + "start": 167.78, + "end": 167.82, + "confidence": 0.855 + }, + { + "text": "dépendance", + "start": 167.82, + "end": 168.32, + "confidence": 0.758 + }, + { + "text": "du", + "start": 168.32, + "end": 168.5, + "confidence": 0.979 + }, + { + "text": "santé.", + "start": 168.5, + "end": 168.7, + "confidence": 0.389 + } + ] + }, + { + "id": 48, + "seek": 16228, + "start": 168.84, + "end": 172.66, + "text": " Ces vidéos, en fait, on est un santé qui a été établie, c'est un soit mon termine,", + "tokens": [ + 28414, + 25417, + 11, + 465, + 3887, + 11, + 322, + 871, + 517, + 30068, + 1956, + 257, + 8862, + 4823, + 455, + 6302, + 11, + 269, + 6, + 377, + 517, + 12703, + 1108, + 1433, + 533, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.7643054464588994, + "compression_ratio": 1.544041450777202, + "no_speech_prob": 
3.89045562769752e-05, + "confidence": 0.487, + "words": [ + { + "text": "Ces", + "start": 168.84, + "end": 169.14, + "confidence": 0.531 + }, + { + "text": "vidéos,", + "start": 169.14, + "end": 169.5, + "confidence": 0.725 + }, + { + "text": "en", + "start": 169.5, + "end": 169.62, + "confidence": 0.757 + }, + { + "text": "fait,", + "start": 169.62, + "end": 169.68, + "confidence": 0.974 + }, + { + "text": "on", + "start": 169.68, + "end": 169.74, + "confidence": 0.306 + }, + { + "text": "est", + "start": 169.74, + "end": 169.86, + "confidence": 0.82 + }, + { + "text": "un", + "start": 169.86, + "end": 170.16, + "confidence": 0.245 + }, + { + "text": "santé", + "start": 170.16, + "end": 170.72, + "confidence": 0.943 + }, + { + "text": "qui", + "start": 170.72, + "end": 170.88, + "confidence": 0.839 + }, + { + "text": "a", + "start": 170.88, + "end": 170.96, + "confidence": 0.533 + }, + { + "text": "été", + "start": 170.96, + "end": 171.08, + "confidence": 0.992 + }, + { + "text": "établie,", + "start": 171.08, + "end": 171.6, + "confidence": 0.316 + }, + { + "text": "c'est", + "start": 171.6, + "end": 171.74, + "confidence": 0.55 + }, + { + "text": "un", + "start": 171.74, + "end": 171.88, + "confidence": 0.651 + }, + { + "text": "soit", + "start": 171.88, + "end": 172.12, + "confidence": 0.284 + }, + { + "text": "mon", + "start": 172.12, + "end": 172.28, + "confidence": 0.225 + }, + { + "text": "termine,", + "start": 172.28, + "end": 172.66, + "confidence": 0.288 + } + ] + }, + { + "id": 49, + "seek": 17312, + "start": 173.14, + "end": 177.42, + "text": " soit définissant des beurs, on définisse un signalétique.", + "tokens": [ + 50364, + 12703, + 40763, + 29492, + 730, + 312, + 2156, + 11, + 322, + 40763, + 7746, + 517, + 6358, + 42379, + 13, + 51436 + ], + "temperature": 0.0, + "avg_logprob": -0.9428024291992188, + "compression_ratio": 1.0169491525423728, + "no_speech_prob": 6.687085260637105e-05, + "confidence": 0.403, + "words": [ + { + "text": "soit", + 
"start": 173.14, + "end": 174.04, + "confidence": 0.127 + }, + { + "text": "définissant", + "start": 174.04, + "end": 175.5, + "confidence": 0.58 + }, + { + "text": "des", + "start": 175.5, + "end": 175.68, + "confidence": 0.813 + }, + { + "text": "beurs,", + "start": 175.68, + "end": 175.96, + "confidence": 0.378 + }, + { + "text": "on", + "start": 175.96, + "end": 176.04, + "confidence": 0.165 + }, + { + "text": "définisse", + "start": 176.04, + "end": 176.42, + "confidence": 0.536 + }, + { + "text": "un", + "start": 176.42, + "end": 176.6, + "confidence": 0.266 + }, + { + "text": "signalétique.", + "start": 176.6, + "end": 177.42, + "confidence": 0.544 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/accurate_japanese.mp3.words.json b/tests/expected/tiny_auto/accurate_japanese.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..3c1037657d4da75adabfdbc3838722088aa93fc5 --- /dev/null +++ b/tests/expected/tiny_auto/accurate_japanese.mp3.words.json @@ -0,0 +1,1766 @@ +{ + "text": "いきます ニュースタブでのサイトメイション機が 実際と違う検に関するご質問いただいております同じ度メインでデレクトリーごとに 別再度として管理上をしているサイトバリマスのサプテレクトリーごとにわけたサイトは それぞれ パブリシャーセンターに登録していくぐるニュース上ではサイトとして認識され パブリコンアイコンはサイトボトフのものが 正しく表示されますしかし ルグル検査結果のニュースタブでは パブリコンサイトメイショー機ともに 正しくない医療時にいいなりますこちらいたいです ものではありません パブリコンはサブテレクトリーごとに設定した", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.04, + "end": 6.62, + "text": "いきます ニュースタブでのサイトメイション機が 実際と違う検に関するご質問いただいております", + "tokens": [ + 50364, + 47348, + 15096, + 233, + 26167, + 3384, + 9550, + 12144, + 28889, + 2474, + 2972, + 23607, + 8040, + 7588, + 21647, + 8040, + 43891, + 4824, + 17543, + 5142, + 220, + 33197, + 34837, + 3193, + 49806, + 38739, + 250, + 4108, + 5196, + 95, + 22570, + 9991, + 43450, + 11361, + 32418, + 18549, + 6117, + 19420, + 50712 + ], + "temperature": 0.0, + "avg_logprob": -0.4399989651095483, + "compression_ratio": 1.6122448979591837, + "no_speech_prob": 0.18976199626922607, + "confidence": 
0.332, + "words": [ + { + "text": "いきます", + "start": 0.04, + "end": 0.56, + "confidence": 0.0 + }, + { + "text": " ニ", + "start": 0.56, + "end": 1.02, + "confidence": 0.012 + }, + { + "text": "ュ", + "start": 1.02, + "end": 1.36, + "confidence": 0.567 + }, + { + "text": "ー", + "start": 1.36, + "end": 1.5, + "confidence": 0.612 + }, + { + "text": "ス", + "start": 1.5, + "end": 1.52, + "confidence": 0.963 + }, + { + "text": "タ", + "start": 1.52, + "end": 1.68, + "confidence": 0.956 + }, + { + "text": "ブ", + "start": 1.68, + "end": 1.8, + "confidence": 0.788 + }, + { + "text": "で", + "start": 1.8, + "end": 2.02, + "confidence": 0.836 + }, + { + "text": "の", + "start": 2.02, + "end": 2.28, + "confidence": 0.869 + }, + { + "text": "サ", + "start": 2.28, + "end": 2.58, + "confidence": 0.031 + }, + { + "text": "イ", + "start": 2.58, + "end": 2.66, + "confidence": 0.98 + }, + { + "text": "ト", + "start": 2.66, + "end": 2.78, + "confidence": 0.994 + }, + { + "text": "メ", + "start": 2.78, + "end": 2.94, + "confidence": 0.356 + }, + { + "text": "イ", + "start": 2.94, + "end": 3.0, + "confidence": 0.162 + }, + { + "text": "ショ", + "start": 3.0, + "end": 3.14, + "confidence": 0.931 + }, + { + "text": "ン", + "start": 3.14, + "end": 3.2, + "confidence": 0.978 + }, + { + "text": "機", + "start": 3.2, + "end": 3.34, + "confidence": 0.409 + }, + { + "text": "が", + "start": 3.34, + "end": 3.5, + "confidence": 0.445 + }, + { + "text": " ", + "start": 3.5, + "end": 3.64, + "confidence": 0.094 + }, + { + "text": "実", + "start": 3.64, + "end": 3.76, + "confidence": 0.702 + }, + { + "text": "際", + "start": 3.76, + "end": 3.9, + "confidence": 0.968 + }, + { + "text": "と", + "start": 3.9, + "end": 4.08, + "confidence": 0.932 + }, + { + "text": "違う", + "start": 4.08, + "end": 4.38, + "confidence": 0.942 + }, + { + "text": "検", + "start": 4.38, + "end": 4.64, + "confidence": 0.255 + }, + { + "text": "に", + "start": 4.64, + "end": 4.74, + "confidence": 0.207 + }, + { + "text": "関", + "start": 4.74, + 
"end": 4.94, + "confidence": 0.412 + }, + { + "text": "する", + "start": 4.94, + "end": 5.12, + "confidence": 0.992 + }, + { + "text": "ご", + "start": 5.12, + "end": 5.3, + "confidence": 0.5 + }, + { + "text": "質", + "start": 5.3, + "end": 5.46, + "confidence": 0.843 + }, + { + "text": "問", + "start": 5.46, + "end": 5.62, + "confidence": 0.977 + }, + { + "text": "いただ", + "start": 5.62, + "end": 5.94, + "confidence": 0.913 + }, + { + "text": "いて", + "start": 5.94, + "end": 6.14, + "confidence": 0.982 + }, + { + "text": "お", + "start": 6.14, + "end": 6.26, + "confidence": 0.806 + }, + { + "text": "ります", + "start": 6.26, + "end": 6.62, + "confidence": 0.963 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 6.92, + "end": 13.58, + "text": "同じ度メインでデレクトリーごとに 別再度として管理上をしているサイトバリマスの", + "tokens": [ + 50712, + 13089, + 9257, + 13127, + 21647, + 8040, + 4824, + 2474, + 31327, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 220, + 16158, + 8623, + 13127, + 3193, + 8822, + 23131, + 13876, + 5708, + 5998, + 8822, + 22979, + 23607, + 8040, + 7588, + 18593, + 12376, + 13258, + 9550, + 2972, + 51044 + ], + "temperature": 0.0, + "avg_logprob": -0.4399989651095483, + "compression_ratio": 1.6122448979591837, + "no_speech_prob": 0.18976199626922607, + "confidence": 0.25, + "words": [ + { + "text": "同", + "start": 6.92, + "end": 7.26, + "confidence": 0.0 + }, + { + "text": "じ", + "start": 7.26, + "end": 7.44, + "confidence": 0.005 + }, + { + "text": "度", + "start": 7.44, + "end": 7.6, + "confidence": 0.003 + }, + { + "text": "メ", + "start": 7.6, + "end": 7.76, + "confidence": 0.002 + }, + { + "text": "イ", + "start": 7.76, + "end": 7.84, + "confidence": 0.684 + }, + { + "text": "ン", + "start": 7.84, + "end": 7.86, + "confidence": 0.889 + }, + { + "text": "で", + "start": 7.86, + "end": 8.0, + "confidence": 0.935 + }, + { + "text": "デ", + "start": 8.0, + "end": 8.12, + "confidence": 0.119 + }, + { + "text": "レ", + "start": 8.12, + "end": 8.28, + "confidence": 0.435 + 
}, + { + "text": "ク", + "start": 8.28, + "end": 8.36, + "confidence": 0.951 + }, + { + "text": "ト", + "start": 8.36, + "end": 8.5, + "confidence": 0.979 + }, + { + "text": "リ", + "start": 8.5, + "end": 8.62, + "confidence": 0.968 + }, + { + "text": "ー", + "start": 8.62, + "end": 8.72, + "confidence": 0.653 + }, + { + "text": "ご", + "start": 8.72, + "end": 8.84, + "confidence": 0.228 + }, + { + "text": "と", + "start": 8.84, + "end": 8.98, + "confidence": 0.993 + }, + { + "text": "に", + "start": 8.98, + "end": 9.14, + "confidence": 0.953 + }, + { + "text": " ", + "start": 9.14, + "end": 9.24, + "confidence": 0.042 + }, + { + "text": "別", + "start": 9.24, + "end": 9.4, + "confidence": 0.583 + }, + { + "text": "再", + "start": 9.4, + "end": 9.58, + "confidence": 0.443 + }, + { + "text": "度", + "start": 9.58, + "end": 9.74, + "confidence": 0.525 + }, + { + "text": "と", + "start": 9.74, + "end": 9.92, + "confidence": 0.876 + }, + { + "text": "して", + "start": 9.92, + "end": 10.42, + "confidence": 0.999 + }, + { + "text": "管", + "start": 10.42, + "end": 10.86, + "confidence": 0.314 + }, + { + "text": "理", + "start": 10.86, + "end": 11.06, + "confidence": 1.0 + }, + { + "text": "上", + "start": 11.06, + "end": 11.36, + "confidence": 0.208 + }, + { + "text": "を", + "start": 11.36, + "end": 11.56, + "confidence": 0.985 + }, + { + "text": "して", + "start": 11.56, + "end": 11.84, + "confidence": 0.937 + }, + { + "text": "いる", + "start": 11.84, + "end": 12.16, + "confidence": 0.942 + }, + { + "text": "サ", + "start": 12.16, + "end": 12.52, + "confidence": 0.078 + }, + { + "text": "イ", + "start": 12.52, + "end": 12.58, + "confidence": 0.978 + }, + { + "text": "ト", + "start": 12.58, + "end": 12.68, + "confidence": 0.982 + }, + { + "text": "バ", + "start": 12.68, + "end": 12.82, + "confidence": 0.259 + }, + { + "text": "リ", + "start": 12.82, + "end": 12.96, + "confidence": 0.363 + }, + { + "text": "マ", + "start": 12.96, + "end": 13.12, + "confidence": 0.114 + }, + { + "text": "ス", + 
"start": 13.12, + "end": 13.18, + "confidence": 0.881 + }, + { + "text": "の", + "start": 13.18, + "end": 13.58, + "confidence": 0.716 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 13.68, + "end": 20.72, + "text": "サプテレクトリーごとにわけたサイトは それぞれ パブリシャーセンターに登録していくぐるニュース上では", + "tokens": [ + 51044, + 23607, + 20953, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 9206, + 7625, + 3368, + 23607, + 8040, + 7588, + 3065, + 47765, + 31563, + 4132, + 15096, + 239, + 28889, + 12376, + 11054, + 17233, + 3384, + 31223, + 4824, + 30736, + 4108, + 46246, + 8822, + 49394, + 35849, + 4895, + 34737, + 26167, + 3384, + 9550, + 5708, + 16719, + 51408 + ], + "temperature": 0.0, + "avg_logprob": -0.4399989651095483, + "compression_ratio": 1.6122448979591837, + "no_speech_prob": 0.18976199626922607, + "confidence": 0.465, + "words": [ + { + "text": "サ", + "start": 13.68, + "end": 14.22, + "confidence": 0.0 + }, + { + "text": "プ", + "start": 14.22, + "end": 14.32, + "confidence": 0.486 + }, + { + "text": "テ", + "start": 14.32, + "end": 14.42, + "confidence": 0.414 + }, + { + "text": "レ", + "start": 14.42, + "end": 14.6, + "confidence": 0.89 + }, + { + "text": "ク", + "start": 14.6, + "end": 14.68, + "confidence": 0.639 + }, + { + "text": "ト", + "start": 14.68, + "end": 14.78, + "confidence": 0.986 + }, + { + "text": "リ", + "start": 14.78, + "end": 14.92, + "confidence": 0.917 + }, + { + "text": "ー", + "start": 14.92, + "end": 15.04, + "confidence": 0.877 + }, + { + "text": "ご", + "start": 15.04, + "end": 15.1, + "confidence": 0.011 + }, + { + "text": "と", + "start": 15.1, + "end": 15.38, + "confidence": 0.985 + }, + { + "text": "に", + "start": 15.38, + "end": 15.86, + "confidence": 0.326 + }, + { + "text": "わ", + "start": 15.86, + "end": 16.02, + "confidence": 0.733 + }, + { + "text": "け", + "start": 16.02, + "end": 16.14, + "confidence": 0.989 + }, + { + "text": "た", + "start": 16.14, + "end": 16.28, + "confidence": 0.957 + }, + { + "text": "サ", + "start": 
16.28, + "end": 16.42, + "confidence": 0.62 + }, + { + "text": "イ", + "start": 16.42, + "end": 16.52, + "confidence": 0.923 + }, + { + "text": "ト", + "start": 16.52, + "end": 16.6, + "confidence": 0.898 + }, + { + "text": "は", + "start": 16.6, + "end": 17.1, + "confidence": 0.989 + }, + { + "text": " それ", + "start": 17.1, + "end": 17.44, + "confidence": 0.057 + }, + { + "text": "ぞ", + "start": 17.44, + "end": 17.62, + "confidence": 0.824 + }, + { + "text": "れ", + "start": 17.62, + "end": 17.72, + "confidence": 0.996 + }, + { + "text": " パ", + "start": 17.72, + "end": 17.86, + "confidence": 0.096 + }, + { + "text": "ブ", + "start": 17.86, + "end": 17.94, + "confidence": 0.939 + }, + { + "text": "リ", + "start": 17.94, + "end": 18.04, + "confidence": 0.994 + }, + { + "text": "シ", + "start": 18.04, + "end": 18.18, + "confidence": 0.864 + }, + { + "text": "ャ", + "start": 18.18, + "end": 18.26, + "confidence": 0.87 + }, + { + "text": "ー", + "start": 18.26, + "end": 18.42, + "confidence": 0.815 + }, + { + "text": "セ", + "start": 18.42, + "end": 18.44, + "confidence": 0.619 + }, + { + "text": "ン", + "start": 18.44, + "end": 18.52, + "confidence": 0.801 + }, + { + "text": "ター", + "start": 18.52, + "end": 18.62, + "confidence": 0.998 + }, + { + "text": "に", + "start": 18.62, + "end": 18.76, + "confidence": 0.832 + }, + { + "text": "登録", + "start": 18.76, + "end": 19.12, + "confidence": 0.958 + }, + { + "text": "して", + "start": 19.12, + "end": 19.38, + "confidence": 0.727 + }, + { + "text": "いく", + "start": 19.38, + "end": 19.62, + "confidence": 0.781 + }, + { + "text": "ぐ", + "start": 19.62, + "end": 19.8, + "confidence": 0.084 + }, + { + "text": "る", + "start": 19.8, + "end": 19.88, + "confidence": 0.864 + }, + { + "text": "ニ", + "start": 19.88, + "end": 20.02, + "confidence": 0.718 + }, + { + "text": "ュ", + "start": 20.02, + "end": 20.14, + "confidence": 0.996 + }, + { + "text": "ー", + "start": 20.14, + "end": 20.16, + "confidence": 0.99 + }, + { + "text": "ス", + "start": 
20.16, + "end": 20.22, + "confidence": 0.986 + }, + { + "text": "上", + "start": 20.22, + "end": 20.4, + "confidence": 0.167 + }, + { + "text": "では", + "start": 20.4, + "end": 20.72, + "confidence": 0.803 + } + ] + }, + { + "id": 3, + "seek": 2088, + "start": 20.88, + "end": 27.0, + "text": "サイトとして認識され パブリコンアイコンはサイトボトフのものが 正しく表示されます", + "tokens": [ + 50364, + 23607, + 8040, + 7588, + 3193, + 8822, + 22041, + 43143, + 6722, + 4132, + 15096, + 239, + 28889, + 12376, + 18066, + 4824, + 12817, + 8040, + 18066, + 4824, + 3065, + 23607, + 8040, + 7588, + 37626, + 7588, + 17320, + 2972, + 44726, + 5142, + 220, + 15789, + 26568, + 40053, + 6722, + 4132, + 5368, + 50684 + ], + "temperature": 0.0, + "avg_logprob": -0.35158648256395686, + "compression_ratio": 1.6926406926406927, + "no_speech_prob": 0.06365812569856644, + "confidence": 0.309, + "words": [ + { + "text": "サ", + "start": 20.88, + "end": 21.26, + "confidence": 0.0 + }, + { + "text": "イ", + "start": 21.26, + "end": 21.34, + "confidence": 0.967 + }, + { + "text": "ト", + "start": 21.34, + "end": 21.44, + "confidence": 0.596 + }, + { + "text": "と", + "start": 21.44, + "end": 21.6, + "confidence": 0.75 + }, + { + "text": "して", + "start": 21.6, + "end": 21.82, + "confidence": 0.984 + }, + { + "text": "認", + "start": 21.82, + "end": 22.08, + "confidence": 0.081 + }, + { + "text": "識", + "start": 22.08, + "end": 22.2, + "confidence": 0.995 + }, + { + "text": "さ", + "start": 22.2, + "end": 22.36, + "confidence": 0.979 + }, + { + "text": "れ", + "start": 22.36, + "end": 22.62, + "confidence": 0.909 + }, + { + "text": " パ", + "start": 22.62, + "end": 22.86, + "confidence": 0.086 + }, + { + "text": "ブ", + "start": 22.86, + "end": 23.0, + "confidence": 0.087 + }, + { + "text": "リ", + "start": 23.0, + "end": 23.16, + "confidence": 0.007 + }, + { + "text": "コ", + "start": 23.16, + "end": 23.26, + "confidence": 0.645 + }, + { + "text": "ン", + "start": 23.26, + "end": 23.28, + "confidence": 0.921 + }, + { + "text": "ア", + "start": 
23.28, + "end": 23.46, + "confidence": 0.084 + }, + { + "text": "イ", + "start": 23.46, + "end": 23.52, + "confidence": 0.944 + }, + { + "text": "コ", + "start": 23.52, + "end": 23.64, + "confidence": 0.258 + }, + { + "text": "ン", + "start": 23.64, + "end": 23.88, + "confidence": 0.956 + }, + { + "text": "は", + "start": 23.88, + "end": 23.9, + "confidence": 0.873 + }, + { + "text": "サ", + "start": 23.9, + "end": 24.04, + "confidence": 0.868 + }, + { + "text": "イ", + "start": 24.04, + "end": 24.16, + "confidence": 0.996 + }, + { + "text": "ト", + "start": 24.16, + "end": 24.24, + "confidence": 0.993 + }, + { + "text": "ボ", + "start": 24.24, + "end": 24.38, + "confidence": 0.656 + }, + { + "text": "ト", + "start": 24.38, + "end": 24.5, + "confidence": 0.892 + }, + { + "text": "フ", + "start": 24.5, + "end": 24.66, + "confidence": 0.018 + }, + { + "text": "の", + "start": 24.66, + "end": 24.7, + "confidence": 0.672 + }, + { + "text": "もの", + "start": 24.7, + "end": 24.9, + "confidence": 0.528 + }, + { + "text": "が", + "start": 24.9, + "end": 25.1, + "confidence": 0.195 + }, + { + "text": " ", + "start": 25.1, + "end": 25.32, + "confidence": 0.184 + }, + { + "text": "正", + "start": 25.32, + "end": 25.4, + "confidence": 0.433 + }, + { + "text": "しく", + "start": 25.4, + "end": 25.66, + "confidence": 0.982 + }, + { + "text": "表示", + "start": 25.66, + "end": 26.0, + "confidence": 0.706 + }, + { + "text": "さ", + "start": 26.0, + "end": 26.28, + "confidence": 0.995 + }, + { + "text": "れ", + "start": 26.28, + "end": 26.56, + "confidence": 0.986 + }, + { + "text": "ます", + "start": 26.56, + "end": 27.0, + "confidence": 0.866 + } + ] + }, + { + "id": 4, + "seek": 2088, + "start": 27.26, + "end": 33.8, + "text": "しかし ルグル検査結果のニュースタブでは パブリコンサイトメイショー機ともに 正しくない医療時にいいなります", + "tokens": [ + 50684, + 32156, + 2849, + 220, + 9405, + 23839, + 9405, + 38739, + 250, + 17238, + 119, + 35181, + 2972, + 34737, + 26167, + 3384, + 9550, + 12144, + 28889, + 16719, + 15096, + 239, + 28889, + 12376, + 
18066, + 4824, + 23607, + 8040, + 7588, + 21647, + 8040, + 43891, + 3384, + 17543, + 3193, + 4801, + 4108, + 220, + 15789, + 26568, + 9311, + 9937, + 119, + 6651, + 224, + 6611, + 4108, + 13806, + 3203, + 19420, + 51024 + ], + "temperature": 0.0, + "avg_logprob": -0.35158648256395686, + "compression_ratio": 1.6926406926406927, + "no_speech_prob": 0.06365812569856644, + "confidence": 0.359, + "words": [ + { + "text": "しか", + "start": 27.26, + "end": 27.56, + "confidence": 0.0 + }, + { + "text": "し", + "start": 27.56, + "end": 27.74, + "confidence": 0.945 + }, + { + "text": " ", + "start": 27.74, + "end": 27.9, + "confidence": 0.02 + }, + { + "text": "ル", + "start": 27.9, + "end": 27.92, + "confidence": 0.176 + }, + { + "text": "グ", + "start": 27.92, + "end": 28.02, + "confidence": 0.43 + }, + { + "text": "ル", + "start": 28.02, + "end": 28.14, + "confidence": 0.988 + }, + { + "text": "検", + "start": 28.14, + "end": 28.32, + "confidence": 0.569 + }, + { + "text": "査", + "start": 28.32, + "end": 28.46, + "confidence": 0.293 + }, + { + "text": "結果", + "start": 28.46, + "end": 28.72, + "confidence": 0.962 + }, + { + "text": "の", + "start": 28.72, + "end": 28.92, + "confidence": 0.932 + }, + { + "text": "ニ", + "start": 28.92, + "end": 29.06, + "confidence": 0.797 + }, + { + "text": "ュ", + "start": 29.06, + "end": 29.14, + "confidence": 0.995 + }, + { + "text": "ー", + "start": 29.14, + "end": 29.2, + "confidence": 0.985 + }, + { + "text": "ス", + "start": 29.2, + "end": 29.24, + "confidence": 0.978 + }, + { + "text": "タ", + "start": 29.24, + "end": 29.34, + "confidence": 0.787 + }, + { + "text": "ブ", + "start": 29.34, + "end": 29.44, + "confidence": 0.571 + }, + { + "text": "では", + "start": 29.44, + "end": 29.66, + "confidence": 0.966 + }, + { + "text": " パ", + "start": 29.66, + "end": 30.02, + "confidence": 0.104 + }, + { + "text": "ブ", + "start": 30.02, + "end": 30.14, + "confidence": 0.052 + }, + { + "text": "リ", + "start": 30.14, + "end": 30.24, + "confidence": 0.013 + 
}, + { + "text": "コ", + "start": 30.24, + "end": 30.32, + "confidence": 0.834 + }, + { + "text": "ン", + "start": 30.32, + "end": 30.42, + "confidence": 0.934 + }, + { + "text": "サ", + "start": 30.42, + "end": 30.54, + "confidence": 0.495 + }, + { + "text": "イ", + "start": 30.54, + "end": 30.62, + "confidence": 0.969 + }, + { + "text": "ト", + "start": 30.62, + "end": 30.72, + "confidence": 0.955 + }, + { + "text": "メ", + "start": 30.72, + "end": 30.86, + "confidence": 0.254 + }, + { + "text": "イ", + "start": 30.86, + "end": 30.92, + "confidence": 0.503 + }, + { + "text": "ショ", + "start": 30.92, + "end": 31.04, + "confidence": 0.465 + }, + { + "text": "ー", + "start": 31.04, + "end": 31.08, + "confidence": 0.612 + }, + { + "text": "機", + "start": 31.08, + "end": 31.24, + "confidence": 0.115 + }, + { + "text": "と", + "start": 31.24, + "end": 31.42, + "confidence": 0.22 + }, + { + "text": "も", + "start": 31.42, + "end": 31.56, + "confidence": 0.836 + }, + { + "text": "に", + "start": 31.56, + "end": 31.66, + "confidence": 0.941 + }, + { + "text": " ", + "start": 31.66, + "end": 31.8, + "confidence": 0.378 + }, + { + "text": "正", + "start": 31.8, + "end": 31.92, + "confidence": 0.34 + }, + { + "text": "しく", + "start": 31.92, + "end": 32.18, + "confidence": 0.998 + }, + { + "text": "ない", + "start": 32.18, + "end": 32.4, + "confidence": 0.99 + }, + { + "text": "医", + "start": 32.4, + "end": 32.6, + "confidence": 0.268 + }, + { + "text": "療", + "start": 32.6, + "end": 32.76, + "confidence": 0.576 + }, + { + "text": "時", + "start": 32.76, + "end": 32.96, + "confidence": 0.463 + }, + { + "text": "に", + "start": 32.96, + "end": 33.12, + "confidence": 0.905 + }, + { + "text": "いい", + "start": 33.12, + "end": 33.36, + "confidence": 0.566 + }, + { + "text": "な", + "start": 33.36, + "end": 33.48, + "confidence": 0.835 + }, + { + "text": "ります", + "start": 33.48, + "end": 33.8, + "confidence": 0.963 + } + ] + }, + { + "id": 5, + "seek": 2088, + "start": 34.02, + "end": 40.38, + 
"text": "こちらいたいです ものではありません パブリコンはサブテレクトリーごとに設定した", + "tokens": [ + 51024, + 34395, + 17679, + 1764, + 4767, + 32505, + 2972, + 16719, + 14498, + 30250, + 15096, + 239, + 28889, + 12376, + 18066, + 4824, + 3065, + 23607, + 28889, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 39035, + 12088, + 8533, + 51388 + ], + "temperature": 0.0, + "avg_logprob": -0.35158648256395686, + "compression_ratio": 1.6926406926406927, + "no_speech_prob": 0.06365812569856644, + "confidence": 0.194, + "words": [ + { + "text": "こちら", + "start": 34.02, + "end": 34.48, + "confidence": 0.0 + }, + { + "text": "いた", + "start": 34.48, + "end": 34.82, + "confidence": 0.102 + }, + { + "text": "い", + "start": 34.82, + "end": 35.0, + "confidence": 0.002 + }, + { + "text": "です", + "start": 35.0, + "end": 35.14, + "confidence": 0.005 + }, + { + "text": " も", + "start": 35.14, + "end": 35.18, + "confidence": 0.003 + }, + { + "text": "の", + "start": 35.18, + "end": 35.28, + "confidence": 0.735 + }, + { + "text": "では", + "start": 35.28, + "end": 35.5, + "confidence": 0.984 + }, + { + "text": "あり", + "start": 35.5, + "end": 35.72, + "confidence": 0.96 + }, + { + "text": "ません", + "start": 35.72, + "end": 36.14, + "confidence": 1.0 + }, + { + "text": " パ", + "start": 36.14, + "end": 36.9, + "confidence": 0.222 + }, + { + "text": "ブ", + "start": 36.9, + "end": 37.02, + "confidence": 0.011 + }, + { + "text": "リ", + "start": 37.02, + "end": 37.06, + "confidence": 0.33 + }, + { + "text": "コ", + "start": 37.06, + "end": 37.18, + "confidence": 0.919 + }, + { + "text": "ン", + "start": 37.18, + "end": 37.94, + "confidence": 0.844 + }, + { + "text": "は", + "start": 37.94, + "end": 37.96, + "confidence": 0.942 + }, + { + "text": "サ", + "start": 37.96, + "end": 38.24, + "confidence": 0.27 + }, + { + "text": "ブ", + "start": 38.24, + "end": 38.32, + "confidence": 0.976 + }, + { + "text": "テ", + "start": 38.32, + "end": 38.42, + "confidence": 0.368 + }, + { + "text": "レ", + "start": 38.42, 
+ "end": 38.56, + "confidence": 0.373 + }, + { + "text": "ク", + "start": 38.56, + "end": 38.66, + "confidence": 0.751 + }, + { + "text": "ト", + "start": 38.66, + "end": 38.78, + "confidence": 0.819 + }, + { + "text": "リ", + "start": 38.78, + "end": 38.92, + "confidence": 0.984 + }, + { + "text": "ー", + "start": 38.92, + "end": 38.96, + "confidence": 0.512 + }, + { + "text": "ご", + "start": 38.96, + "end": 39.08, + "confidence": 0.029 + }, + { + "text": "と", + "start": 39.08, + "end": 39.22, + "confidence": 0.975 + }, + { + "text": "に", + "start": 39.22, + "end": 39.56, + "confidence": 0.971 + }, + { + "text": "設", + "start": 39.56, + "end": 39.84, + "confidence": 0.666 + }, + { + "text": "定", + "start": 39.84, + "end": 40.06, + "confidence": 0.996 + }, + { + "text": "した", + "start": 40.06, + "end": 40.38, + "confidence": 0.938 + } + ] + } + ], + "language": "ja", + "language_probs": { + "en": 0.006242657545953989, + "zh": 0.0014827612321823835, + "de": 0.00011256561992922798, + "es": 0.0013291386421769857, + "ru": 0.00022561925288755447, + "ko": 0.00042481819400563836, + "fr": 0.0003206696128472686, + "ja": 0.9862462282180786, + "pt": 0.0003521866456139833, + "tr": 8.698396413819864e-05, + "pl": 0.0008716703741811216, + "ca": 1.310503307649924e-06, + "nl": 1.0388754162704572e-05, + "ar": 1.634380350878928e-05, + "sv": 1.8519956938689575e-05, + "it": 0.0001502948289271444, + "id": 1.4650489902123809e-05, + "hi": 3.542034392012283e-05, + "fi": 3.327432932564989e-05, + "vi": 9.459067769057583e-06, + "he": 1.488120233261725e-05, + "uk": 2.396660238446202e-05, + "el": 3.683132672449574e-05, + "ms": 3.514470154186711e-05, + "cs": 1.2629512639250606e-05, + "ro": 2.034019234997686e-05, + "da": 7.294049737538444e-07, + "hu": 8.41306882648496e-06, + "ta": 3.047011659873533e-06, + "no": 4.935400852446037e-07, + "th": 2.396660238446202e-05, + "ur": 1.823282946133986e-05, + "hr": 3.2435270895803114e-06, + "bg": 5.906901492380712e-07, + "lt": 1.666117981358184e-07, + "la": 
0.00018271202861797065, + "mi": 8.044702553888783e-05, + "ml": 1.6182557374122553e-06, + "cy": 6.168086838442832e-05, + "sk": 7.948603979457403e-07, + "te": 2.2118931610748405e-06, + "fa": 1.647198951104656e-05, + "lv": 2.2245595232561755e-07, + "bn": 1.0470233064552303e-05, + "sr": 5.132005185259914e-07, + "az": 6.641308232246956e-07, + "sl": 1.0286258884661947e-06, + "kn": 4.97411008382187e-07, + "et": 6.641308232246956e-07, + "mk": 2.2420069001327647e-07, + "br": 3.301538890809752e-05, + "eu": 3.920674862456508e-05, + "is": 1.7324887835457048e-07, + "hy": 1.6566315252930508e-06, + "ne": 9.148787967205863e-07, + "mn": 2.098585719068069e-05, + "bs": 1.1565151680770214e-06, + "kk": 2.4623628291919886e-07, + "sq": 8.798302815193892e-07, + "sw": 8.885971510608215e-06, + "gl": 4.239260306349024e-05, + "mr": 5.725165124204068e-07, + "pa": 1.6309478496623342e-06, + "si": 1.4423355423787143e-05, + "km": 4.045130481244996e-05, + "sn": 2.304845656908583e-05, + "yo": 3.3991873351624236e-06, + "so": 2.3866036258368695e-07, + "af": 9.969784287022776e-07, + "oc": 5.474488716572523e-06, + "ka": 1.0864454225156805e-06, + "be": 5.692566901416285e-06, + "tg": 1.913662650565584e-08, + "sd": 1.6959174899966456e-06, + "gu": 3.2115266890286875e-07, + "am": 1.2975741014997766e-07, + "yi": 4.197435828245943e-06, + "lo": 2.600773427730019e-07, + "uz": 3.430495609801909e-10, + "fo": 1.4281055200626724e-06, + "ht": 2.373014922341099e-06, + "ps": 1.5321337514251354e-06, + "tk": 7.745855623575437e-10, + "nn": 0.0009135027066804469, + "mt": 1.0673553418882875e-07, + "sa": 1.7262496839975938e-05, + "lb": 3.051601860093456e-09, + "my": 2.098585719068069e-05, + "bo": 1.303041608480271e-05, + "tl": 7.029382231849013e-06, + "mg": 1.3073606641711422e-09, + "as": 4.321581172916922e-07, + "tt": 3.4714515706468774e-09, + "haw": 2.8909242246299982e-05, + "ln": 8.594491305302654e-07, + "ha": 6.384976991569147e-09, + "ba": 5.375886957814657e-10, + "jw": 0.00019148056162521243, + "su": 
3.087572864046706e-09 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/accurate_jp_japanese.mp3.words.json b/tests/expected/tiny_auto/accurate_jp_japanese.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..97df2ecc55e5966301e8c2c89c03de20fa39ae73 --- /dev/null +++ b/tests/expected/tiny_auto/accurate_jp_japanese.mp3.words.json @@ -0,0 +1,1665 @@ +{ + "text": "いきます ニュースタブでのサイトメイション機が 実際と違う検に関するご質問いただいております同じ度メインでデレクトリーごとに 別再度として管理上をしているサイトバリマスのサプテレクトリーごとにわけたサイトは それぞれ パブリシャーセンターに登録していくぐるニュース上ではサイトとして認識され パブリコンアイコンはサイトボトフのものが 正しく表示されますしかし ルグル検査結果のニュースタブでは パブリコンサイトメイショー機ともに 正しくない医療時にいいなりますこちらいたいです ものではありません パブリコンはサブテレクトリーごとに設定した", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.08, + "end": 6.62, + "text": "いきます ニュースタブでのサイトメイション機が 実際と違う検に関するご質問いただいております", + "tokens": [ + 50364, + 47348, + 15096, + 233, + 26167, + 3384, + 9550, + 12144, + 28889, + 2474, + 2972, + 23607, + 8040, + 7588, + 21647, + 8040, + 43891, + 4824, + 17543, + 5142, + 220, + 33197, + 34837, + 3193, + 49806, + 38739, + 250, + 4108, + 5196, + 95, + 22570, + 9991, + 43450, + 11361, + 32418, + 18549, + 6117, + 19420, + 50712 + ], + "temperature": 0.0, + "avg_logprob": -0.4399989651095483, + "compression_ratio": 1.6122448979591837, + "no_speech_prob": 0.18976199626922607, + "confidence": 0.549, + "words": [ + { + "text": "いきます", + "start": 0.08, + "end": 0.6, + "confidence": 0.173 + }, + { + "text": " ニ", + "start": 0.6, + "end": 1.32, + "confidence": 0.187 + }, + { + "text": "ュ", + "start": 1.32, + "end": 1.38, + "confidence": 0.974 + }, + { + "text": "ー", + "start": 1.38, + "end": 1.5, + "confidence": 0.945 + }, + { + "text": "ス", + "start": 1.5, + "end": 1.52, + "confidence": 0.961 + }, + { + "text": "タ", + "start": 1.52, + "end": 1.68, + "confidence": 0.87 + }, + { + "text": "ブ", + "start": 1.68, + "end": 1.8, + "confidence": 0.772 + }, + { + "text": "で", + "start": 1.8, + "end": 2.02, + "confidence": 0.948 + }, + { + "text": "の", + 
"start": 2.02, + "end": 2.26, + "confidence": 0.838 + }, + { + "text": "サ", + "start": 2.26, + "end": 2.56, + "confidence": 0.015 + }, + { + "text": "イ", + "start": 2.56, + "end": 2.66, + "confidence": 0.983 + }, + { + "text": "ト", + "start": 2.66, + "end": 2.76, + "confidence": 0.992 + }, + { + "text": "メ", + "start": 2.76, + "end": 2.94, + "confidence": 0.385 + }, + { + "text": "イ", + "start": 2.94, + "end": 3.0, + "confidence": 0.233 + }, + { + "text": "ショ", + "start": 3.0, + "end": 3.14, + "confidence": 0.894 + }, + { + "text": "ン", + "start": 3.14, + "end": 3.2, + "confidence": 0.983 + }, + { + "text": "機", + "start": 3.2, + "end": 3.32, + "confidence": 0.363 + }, + { + "text": "が", + "start": 3.32, + "end": 3.5, + "confidence": 0.64 + }, + { + "text": " ", + "start": 3.5, + "end": 3.6, + "confidence": 0.232 + }, + { + "text": "実", + "start": 3.6, + "end": 3.76, + "confidence": 0.75 + }, + { + "text": "際", + "start": 3.76, + "end": 3.9, + "confidence": 0.98 + }, + { + "text": "と", + "start": 3.9, + "end": 4.08, + "confidence": 0.928 + }, + { + "text": "違う", + "start": 4.08, + "end": 4.38, + "confidence": 0.898 + }, + { + "text": "検", + "start": 4.38, + "end": 4.64, + "confidence": 0.327 + }, + { + "text": "に", + "start": 4.64, + "end": 4.74, + "confidence": 0.187 + }, + { + "text": "関", + "start": 4.74, + "end": 4.94, + "confidence": 0.497 + }, + { + "text": "する", + "start": 4.94, + "end": 5.12, + "confidence": 0.988 + }, + { + "text": "ご", + "start": 5.12, + "end": 5.3, + "confidence": 0.649 + }, + { + "text": "質", + "start": 5.3, + "end": 5.46, + "confidence": 0.893 + }, + { + "text": "問", + "start": 5.46, + "end": 5.62, + "confidence": 0.992 + }, + { + "text": "いただ", + "start": 5.62, + "end": 5.92, + "confidence": 0.936 + }, + { + "text": "いて", + "start": 5.92, + "end": 6.14, + "confidence": 0.981 + }, + { + "text": "お", + "start": 6.14, + "end": 6.26, + "confidence": 0.817 + }, + { + "text": "ります", + "start": 6.26, + "end": 6.62, + "confidence": 0.971 + } 
+ ] + }, + { + "id": 1, + "seek": 0, + "start": 6.94, + "end": 13.58, + "text": "同じ度メインでデレクトリーごとに 別再度として管理上をしているサイトバリマスの", + "tokens": [ + 50712, + 13089, + 9257, + 13127, + 21647, + 8040, + 4824, + 2474, + 31327, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 220, + 16158, + 8623, + 13127, + 3193, + 8822, + 23131, + 13876, + 5708, + 5998, + 8822, + 22979, + 23607, + 8040, + 7588, + 18593, + 12376, + 13258, + 9550, + 2972, + 51044 + ], + "temperature": 0.0, + "avg_logprob": -0.4399989651095483, + "compression_ratio": 1.6122448979591837, + "no_speech_prob": 0.18976199626922607, + "confidence": 0.525, + "words": [ + { + "text": "同", + "start": 6.94, + "end": 7.28, + "confidence": 0.469 + }, + { + "text": "じ", + "start": 7.28, + "end": 7.44, + "confidence": 0.218 + }, + { + "text": "度", + "start": 7.44, + "end": 7.62, + "confidence": 0.139 + }, + { + "text": "メ", + "start": 7.62, + "end": 7.74, + "confidence": 0.209 + }, + { + "text": "イ", + "start": 7.74, + "end": 7.82, + "confidence": 0.904 + }, + { + "text": "ン", + "start": 7.82, + "end": 7.84, + "confidence": 0.911 + }, + { + "text": "で", + "start": 7.84, + "end": 8.0, + "confidence": 0.979 + }, + { + "text": "デ", + "start": 8.0, + "end": 8.14, + "confidence": 0.37 + }, + { + "text": "レ", + "start": 8.14, + "end": 8.28, + "confidence": 0.674 + }, + { + "text": "ク", + "start": 8.28, + "end": 8.36, + "confidence": 0.974 + }, + { + "text": "ト", + "start": 8.36, + "end": 8.5, + "confidence": 0.979 + }, + { + "text": "リ", + "start": 8.5, + "end": 8.62, + "confidence": 0.96 + }, + { + "text": "ー", + "start": 8.62, + "end": 8.72, + "confidence": 0.701 + }, + { + "text": "ご", + "start": 8.72, + "end": 8.86, + "confidence": 0.267 + }, + { + "text": "と", + "start": 8.86, + "end": 9.0, + "confidence": 0.993 + }, + { + "text": "に", + "start": 9.0, + "end": 9.14, + "confidence": 0.967 + }, + { + "text": " ", + "start": 9.14, + "end": 9.34, + "confidence": 0.12 + }, + { + "text": "別", + "start": 9.34, + 
"end": 9.4, + "confidence": 0.527 + }, + { + "text": "再", + "start": 9.4, + "end": 9.58, + "confidence": 0.341 + }, + { + "text": "度", + "start": 9.58, + "end": 9.74, + "confidence": 0.323 + }, + { + "text": "と", + "start": 9.74, + "end": 9.92, + "confidence": 0.891 + }, + { + "text": "して", + "start": 9.92, + "end": 10.4, + "confidence": 0.998 + }, + { + "text": "管", + "start": 10.4, + "end": 10.86, + "confidence": 0.418 + }, + { + "text": "理", + "start": 10.86, + "end": 11.08, + "confidence": 1.0 + }, + { + "text": "上", + "start": 11.08, + "end": 11.36, + "confidence": 0.472 + }, + { + "text": "を", + "start": 11.36, + "end": 11.56, + "confidence": 0.987 + }, + { + "text": "して", + "start": 11.56, + "end": 11.84, + "confidence": 0.931 + }, + { + "text": "いる", + "start": 11.84, + "end": 12.16, + "confidence": 0.939 + }, + { + "text": "サ", + "start": 12.16, + "end": 12.52, + "confidence": 0.069 + }, + { + "text": "イ", + "start": 12.52, + "end": 12.58, + "confidence": 0.985 + }, + { + "text": "ト", + "start": 12.58, + "end": 12.7, + "confidence": 0.976 + }, + { + "text": "バ", + "start": 12.7, + "end": 12.82, + "confidence": 0.297 + }, + { + "text": "リ", + "start": 12.82, + "end": 12.96, + "confidence": 0.362 + }, + { + "text": "マ", + "start": 12.96, + "end": 13.12, + "confidence": 0.19 + }, + { + "text": "ス", + "start": 13.12, + "end": 13.22, + "confidence": 0.859 + }, + { + "text": "の", + "start": 13.22, + "end": 13.58, + "confidence": 0.701 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 13.68, + "end": 20.74, + "text": "サプテレクトリーごとにわけたサイトは それぞれ パブリシャーセンターに登録していくぐるニュース上では", + "tokens": [ + 51044, + 23607, + 20953, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 9206, + 7625, + 3368, + 23607, + 8040, + 7588, + 3065, + 47765, + 31563, + 4132, + 15096, + 239, + 28889, + 12376, + 11054, + 17233, + 3384, + 31223, + 4824, + 30736, + 4108, + 46246, + 8822, + 49394, + 35849, + 4895, + 34737, + 26167, + 3384, + 9550, + 5708, + 16719, + 51408 + 
], + "temperature": 0.0, + "avg_logprob": -0.4399989651095483, + "compression_ratio": 1.6122448979591837, + "no_speech_prob": 0.18976199626922607, + "confidence": 0.622, + "words": [ + { + "text": "サ", + "start": 13.68, + "end": 14.22, + "confidence": 0.397 + }, + { + "text": "プ", + "start": 14.22, + "end": 14.32, + "confidence": 0.532 + }, + { + "text": "テ", + "start": 14.32, + "end": 14.42, + "confidence": 0.637 + }, + { + "text": "レ", + "start": 14.42, + "end": 14.58, + "confidence": 0.825 + }, + { + "text": "ク", + "start": 14.58, + "end": 14.66, + "confidence": 0.474 + }, + { + "text": "ト", + "start": 14.66, + "end": 14.78, + "confidence": 0.973 + }, + { + "text": "リ", + "start": 14.78, + "end": 14.92, + "confidence": 0.873 + }, + { + "text": "ー", + "start": 14.92, + "end": 15.04, + "confidence": 0.917 + }, + { + "text": "ご", + "start": 15.04, + "end": 15.1, + "confidence": 0.016 + }, + { + "text": "と", + "start": 15.1, + "end": 15.38, + "confidence": 0.991 + }, + { + "text": "に", + "start": 15.38, + "end": 15.86, + "confidence": 0.493 + }, + { + "text": "わ", + "start": 15.86, + "end": 16.02, + "confidence": 0.756 + }, + { + "text": "け", + "start": 16.02, + "end": 16.14, + "confidence": 0.988 + }, + { + "text": "た", + "start": 16.14, + "end": 16.28, + "confidence": 0.951 + }, + { + "text": "サ", + "start": 16.28, + "end": 16.42, + "confidence": 0.802 + }, + { + "text": "イ", + "start": 16.42, + "end": 16.5, + "confidence": 0.981 + }, + { + "text": "ト", + "start": 16.5, + "end": 16.6, + "confidence": 0.904 + }, + { + "text": "は", + "start": 16.6, + "end": 17.08, + "confidence": 0.976 + }, + { + "text": " それ", + "start": 17.08, + "end": 17.44, + "confidence": 0.128 + }, + { + "text": "ぞ", + "start": 17.44, + "end": 17.6, + "confidence": 0.85 + }, + { + "text": "れ", + "start": 17.6, + "end": 17.72, + "confidence": 0.995 + }, + { + "text": " パ", + "start": 17.72, + "end": 17.86, + "confidence": 0.177 + }, + { + "text": "ブ", + "start": 17.86, + "end": 17.94, + 
"confidence": 0.941 + }, + { + "text": "リ", + "start": 17.94, + "end": 18.04, + "confidence": 0.991 + }, + { + "text": "シ", + "start": 18.04, + "end": 18.18, + "confidence": 0.755 + }, + { + "text": "ャ", + "start": 18.18, + "end": 18.26, + "confidence": 0.825 + }, + { + "text": "ー", + "start": 18.26, + "end": 18.42, + "confidence": 0.765 + }, + { + "text": "セ", + "start": 18.42, + "end": 18.44, + "confidence": 0.588 + }, + { + "text": "ン", + "start": 18.44, + "end": 18.52, + "confidence": 0.832 + }, + { + "text": "ター", + "start": 18.52, + "end": 18.6, + "confidence": 0.998 + }, + { + "text": "に", + "start": 18.6, + "end": 18.76, + "confidence": 0.858 + }, + { + "text": "登録", + "start": 18.76, + "end": 19.12, + "confidence": 0.902 + }, + { + "text": "して", + "start": 19.12, + "end": 19.38, + "confidence": 0.766 + }, + { + "text": "いく", + "start": 19.38, + "end": 19.62, + "confidence": 0.877 + }, + { + "text": "ぐ", + "start": 19.62, + "end": 19.78, + "confidence": 0.221 + }, + { + "text": "る", + "start": 19.78, + "end": 19.9, + "confidence": 0.85 + }, + { + "text": "ニ", + "start": 19.9, + "end": 20.02, + "confidence": 0.68 + }, + { + "text": "ュ", + "start": 20.02, + "end": 20.14, + "confidence": 0.996 + }, + { + "text": "ー", + "start": 20.14, + "end": 20.16, + "confidence": 0.989 + }, + { + "text": "ス", + "start": 20.16, + "end": 20.22, + "confidence": 0.982 + }, + { + "text": "上", + "start": 20.22, + "end": 20.4, + "confidence": 0.236 + }, + { + "text": "では", + "start": 20.4, + "end": 20.74, + "confidence": 0.763 + } + ] + }, + { + "id": 3, + "seek": 2088, + "start": 20.9, + "end": 27.0, + "text": "サイトとして認識され パブリコンアイコンはサイトボトフのものが 正しく表示されます", + "tokens": [ + 50364, + 23607, + 8040, + 7588, + 3193, + 8822, + 22041, + 43143, + 6722, + 4132, + 15096, + 239, + 28889, + 12376, + 18066, + 4824, + 12817, + 8040, + 18066, + 4824, + 3065, + 23607, + 8040, + 7588, + 37626, + 7588, + 17320, + 2972, + 44726, + 5142, + 220, + 15789, + 26568, + 40053, + 6722, + 4132, + 5368, + 
50684 + ], + "temperature": 0.0, + "avg_logprob": -0.35158648256395686, + "compression_ratio": 1.6926406926406927, + "no_speech_prob": 0.06365812569856644, + "confidence": 0.389, + "words": [ + { + "text": "サ", + "start": 20.9, + "end": 21.26, + "confidence": 0.002 + }, + { + "text": "イ", + "start": 21.26, + "end": 21.34, + "confidence": 0.939 + }, + { + "text": "ト", + "start": 21.34, + "end": 21.44, + "confidence": 0.379 + }, + { + "text": "と", + "start": 21.44, + "end": 21.58, + "confidence": 0.831 + }, + { + "text": "して", + "start": 21.58, + "end": 21.8, + "confidence": 0.981 + }, + { + "text": "認", + "start": 21.8, + "end": 22.08, + "confidence": 0.179 + }, + { + "text": "識", + "start": 22.08, + "end": 22.2, + "confidence": 0.986 + }, + { + "text": "さ", + "start": 22.2, + "end": 22.34, + "confidence": 0.982 + }, + { + "text": "れ", + "start": 22.34, + "end": 22.64, + "confidence": 0.948 + }, + { + "text": " パ", + "start": 22.64, + "end": 22.86, + "confidence": 0.141 + }, + { + "text": "ブ", + "start": 22.86, + "end": 23.0, + "confidence": 0.051 + }, + { + "text": "リ", + "start": 23.0, + "end": 23.18, + "confidence": 0.007 + }, + { + "text": "コ", + "start": 23.18, + "end": 23.22, + "confidence": 0.817 + }, + { + "text": "ン", + "start": 23.22, + "end": 23.3, + "confidence": 0.887 + }, + { + "text": "ア", + "start": 23.3, + "end": 23.46, + "confidence": 0.107 + }, + { + "text": "イ", + "start": 23.46, + "end": 23.52, + "confidence": 0.957 + }, + { + "text": "コ", + "start": 23.52, + "end": 23.64, + "confidence": 0.308 + }, + { + "text": "ン", + "start": 23.64, + "end": 23.86, + "confidence": 0.893 + }, + { + "text": "は", + "start": 23.86, + "end": 23.88, + "confidence": 0.834 + }, + { + "text": "サ", + "start": 23.88, + "end": 24.04, + "confidence": 0.642 + }, + { + "text": "イ", + "start": 24.04, + "end": 24.16, + "confidence": 0.997 + }, + { + "text": "ト", + "start": 24.16, + "end": 24.24, + "confidence": 0.989 + }, + { + "text": "ボ", + "start": 24.24, + "end": 24.38, + 
"confidence": 0.588 + }, + { + "text": "ト", + "start": 24.38, + "end": 24.52, + "confidence": 0.861 + }, + { + "text": "フ", + "start": 24.52, + "end": 24.66, + "confidence": 0.037 + }, + { + "text": "の", + "start": 24.66, + "end": 24.72, + "confidence": 0.66 + }, + { + "text": "もの", + "start": 24.72, + "end": 24.9, + "confidence": 0.501 + }, + { + "text": "が", + "start": 24.9, + "end": 25.08, + "confidence": 0.338 + }, + { + "text": " ", + "start": 25.08, + "end": 25.32, + "confidence": 0.283 + }, + { + "text": "正", + "start": 25.32, + "end": 25.4, + "confidence": 0.631 + }, + { + "text": "しく", + "start": 25.4, + "end": 25.66, + "confidence": 0.979 + }, + { + "text": "表示", + "start": 25.66, + "end": 26.0, + "confidence": 0.665 + }, + { + "text": "さ", + "start": 26.0, + "end": 26.28, + "confidence": 0.993 + }, + { + "text": "れ", + "start": 26.28, + "end": 26.6, + "confidence": 0.986 + }, + { + "text": "ます", + "start": 26.6, + "end": 27.0, + "confidence": 0.888 + } + ] + }, + { + "id": 4, + "seek": 2088, + "start": 27.28, + "end": 33.8, + "text": "しかし ルグル検査結果のニュースタブでは パブリコンサイトメイショー機ともに 正しくない医療時にいいなります", + "tokens": [ + 50684, + 32156, + 2849, + 220, + 9405, + 23839, + 9405, + 38739, + 250, + 17238, + 119, + 35181, + 2972, + 34737, + 26167, + 3384, + 9550, + 12144, + 28889, + 16719, + 15096, + 239, + 28889, + 12376, + 18066, + 4824, + 23607, + 8040, + 7588, + 21647, + 8040, + 43891, + 3384, + 17543, + 3193, + 4801, + 4108, + 220, + 15789, + 26568, + 9311, + 9937, + 119, + 6651, + 224, + 6611, + 4108, + 13806, + 3203, + 19420, + 51024 + ], + "temperature": 0.0, + "avg_logprob": -0.35158648256395686, + "compression_ratio": 1.6926406926406927, + "no_speech_prob": 0.06365812569856644, + "confidence": 0.502, + "words": [ + { + "text": "しか", + "start": 27.28, + "end": 27.58, + "confidence": 0.909 + }, + { + "text": "し", + "start": 27.58, + "end": 27.72, + "confidence": 0.989 + }, + { + "text": " ", + "start": 27.72, + "end": 27.86, + "confidence": 0.065 + }, + { + "text": 
"ル", + "start": 27.86, + "end": 27.9, + "confidence": 0.236 + }, + { + "text": "グ", + "start": 27.9, + "end": 28.0, + "confidence": 0.538 + }, + { + "text": "ル", + "start": 28.0, + "end": 28.14, + "confidence": 0.989 + }, + { + "text": "検", + "start": 28.14, + "end": 28.32, + "confidence": 0.565 + }, + { + "text": "査", + "start": 28.32, + "end": 28.46, + "confidence": 0.728 + }, + { + "text": "結果", + "start": 28.46, + "end": 28.72, + "confidence": 0.976 + }, + { + "text": "の", + "start": 28.72, + "end": 28.92, + "confidence": 0.96 + }, + { + "text": "ニ", + "start": 28.92, + "end": 29.06, + "confidence": 0.777 + }, + { + "text": "ュ", + "start": 29.06, + "end": 29.14, + "confidence": 0.995 + }, + { + "text": "ー", + "start": 29.14, + "end": 29.2, + "confidence": 0.98 + }, + { + "text": "ス", + "start": 29.2, + "end": 29.26, + "confidence": 0.971 + }, + { + "text": "タ", + "start": 29.26, + "end": 29.34, + "confidence": 0.806 + }, + { + "text": "ブ", + "start": 29.34, + "end": 29.44, + "confidence": 0.685 + }, + { + "text": "では", + "start": 29.44, + "end": 29.68, + "confidence": 0.942 + }, + { + "text": " パ", + "start": 29.68, + "end": 30.02, + "confidence": 0.123 + }, + { + "text": "ブ", + "start": 30.02, + "end": 30.14, + "confidence": 0.041 + }, + { + "text": "リ", + "start": 30.14, + "end": 30.32, + "confidence": 0.021 + }, + { + "text": "コ", + "start": 30.32, + "end": 30.34, + "confidence": 0.89 + }, + { + "text": "ン", + "start": 30.34, + "end": 30.42, + "confidence": 0.918 + }, + { + "text": "サ", + "start": 30.42, + "end": 30.54, + "confidence": 0.426 + }, + { + "text": "イ", + "start": 30.54, + "end": 30.62, + "confidence": 0.979 + }, + { + "text": "ト", + "start": 30.62, + "end": 30.72, + "confidence": 0.956 + }, + { + "text": "メ", + "start": 30.72, + "end": 30.86, + "confidence": 0.251 + }, + { + "text": "イ", + "start": 30.86, + "end": 30.92, + "confidence": 0.622 + }, + { + "text": "ショ", + "start": 30.92, + "end": 31.02, + "confidence": 0.416 + }, + { + "text": "ー", 
+ "start": 31.02, + "end": 31.08, + "confidence": 0.618 + }, + { + "text": "機", + "start": 31.08, + "end": 31.24, + "confidence": 0.126 + }, + { + "text": "と", + "start": 31.24, + "end": 31.42, + "confidence": 0.357 + }, + { + "text": "も", + "start": 31.42, + "end": 31.54, + "confidence": 0.81 + }, + { + "text": "に", + "start": 31.54, + "end": 31.66, + "confidence": 0.919 + }, + { + "text": " ", + "start": 31.66, + "end": 31.8, + "confidence": 0.402 + }, + { + "text": "正", + "start": 31.8, + "end": 31.96, + "confidence": 0.437 + }, + { + "text": "しく", + "start": 31.96, + "end": 32.18, + "confidence": 0.998 + }, + { + "text": "ない", + "start": 32.18, + "end": 32.4, + "confidence": 0.981 + }, + { + "text": "医", + "start": 32.4, + "end": 32.6, + "confidence": 0.234 + }, + { + "text": "療", + "start": 32.6, + "end": 32.76, + "confidence": 0.686 + }, + { + "text": "時", + "start": 32.76, + "end": 32.96, + "confidence": 0.452 + }, + { + "text": "に", + "start": 32.96, + "end": 33.12, + "confidence": 0.925 + }, + { + "text": "いい", + "start": 33.12, + "end": 33.36, + "confidence": 0.577 + }, + { + "text": "な", + "start": 33.36, + "end": 33.48, + "confidence": 0.807 + }, + { + "text": "ります", + "start": 33.48, + "end": 33.8, + "confidence": 0.941 + } + ] + }, + { + "id": 5, + "seek": 2088, + "start": 34.04, + "end": 40.36, + "text": "こちらいたいです ものではありません パブリコンはサブテレクトリーごとに設定した", + "tokens": [ + 51024, + 34395, + 17679, + 1764, + 4767, + 32505, + 2972, + 16719, + 14498, + 30250, + 15096, + 239, + 28889, + 12376, + 18066, + 4824, + 3065, + 23607, + 28889, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 39035, + 12088, + 8533, + 51388 + ], + "temperature": 0.0, + "avg_logprob": -0.35158648256395686, + "compression_ratio": 1.6926406926406927, + "no_speech_prob": 0.06365812569856644, + "confidence": 0.364, + "words": [ + { + "text": "こちら", + "start": 34.04, + "end": 34.54, + "confidence": 0.408 + }, + { + "text": "いた", + "start": 34.54, + "end": 34.82, + 
"confidence": 0.254 + }, + { + "text": "い", + "start": 34.82, + "end": 34.98, + "confidence": 0.11 + }, + { + "text": "です", + "start": 34.98, + "end": 35.04, + "confidence": 0.021 + }, + { + "text": " も", + "start": 35.04, + "end": 35.18, + "confidence": 0.009 + }, + { + "text": "の", + "start": 35.18, + "end": 35.28, + "confidence": 0.812 + }, + { + "text": "では", + "start": 35.28, + "end": 35.5, + "confidence": 0.995 + }, + { + "text": "あり", + "start": 35.5, + "end": 35.72, + "confidence": 0.981 + }, + { + "text": "ません", + "start": 35.72, + "end": 36.18, + "confidence": 0.999 + }, + { + "text": " パ", + "start": 36.18, + "end": 36.9, + "confidence": 0.273 + }, + { + "text": "ブ", + "start": 36.9, + "end": 37.02, + "confidence": 0.011 + }, + { + "text": "リ", + "start": 37.02, + "end": 37.1, + "confidence": 0.237 + }, + { + "text": "コ", + "start": 37.1, + "end": 37.18, + "confidence": 0.951 + }, + { + "text": "ン", + "start": 37.18, + "end": 37.84, + "confidence": 0.832 + }, + { + "text": "は", + "start": 37.84, + "end": 37.86, + "confidence": 0.95 + }, + { + "text": "サ", + "start": 37.86, + "end": 38.22, + "confidence": 0.307 + }, + { + "text": "ブ", + "start": 38.22, + "end": 38.32, + "confidence": 0.98 + }, + { + "text": "テ", + "start": 38.32, + "end": 38.42, + "confidence": 0.318 + }, + { + "text": "レ", + "start": 38.42, + "end": 38.56, + "confidence": 0.394 + }, + { + "text": "ク", + "start": 38.56, + "end": 38.66, + "confidence": 0.751 + }, + { + "text": "ト", + "start": 38.66, + "end": 38.78, + "confidence": 0.731 + }, + { + "text": "リ", + "start": 38.78, + "end": 38.92, + "confidence": 0.988 + }, + { + "text": "ー", + "start": 38.92, + "end": 38.96, + "confidence": 0.528 + }, + { + "text": "ご", + "start": 38.96, + "end": 39.08, + "confidence": 0.051 + }, + { + "text": "と", + "start": 39.08, + "end": 39.24, + "confidence": 0.973 + }, + { + "text": "に", + "start": 39.24, + "end": 39.52, + "confidence": 0.978 + }, + { + "text": "設", + "start": 39.52, + "end": 39.84, + 
"confidence": 0.621 + }, + { + "text": "定", + "start": 39.84, + "end": 40.04, + "confidence": 0.996 + }, + { + "text": "した", + "start": 40.04, + "end": 40.36, + "confidence": 0.894 + } + ] + } + ], + "language": "Japanese" +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/bonjour.wav.words.json b/tests/expected/tiny_auto/bonjour.wav.words.json new file mode 100644 index 0000000000000000000000000000000000000000..d20b7b91e5bc59af96ae7a92889c21d219960337 --- /dev/null +++ b/tests/expected/tiny_auto/bonjour.wav.words.json @@ -0,0 +1,133 @@ +{ + "text": " Bonjour !", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.14, + "end": 0.96, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50414 + ], + "temperature": 0.0, + "avg_logprob": -0.6977285861968994, + "compression_ratio": 0.5294117647058824, + "no_speech_prob": 0.019094161689281464, + "confidence": 0.829, + "words": [ + { + "text": "Bonjour !", + "start": 0.14, + "end": 0.96, + "confidence": 0.829 + } + ] + } + ], + "language": "fr", + "language_probs": { + "en": 0.007364001125097275, + "zh": 0.041395243257284164, + "de": 0.0015925770858302712, + "es": 0.0021767946891486645, + "ru": 0.10325776785612106, + "ko": 0.006601048167794943, + "fr": 0.4052142798900604, + "ja": 0.0019210146274417639, + "pt": 0.33332017064094543, + "tr": 0.007421758491545916, + "pl": 0.05315254256129265, + "ca": 6.396045500878245e-05, + "nl": 0.0077174073085188866, + "ar": 0.001450057839974761, + "sv": 0.0062011112459003925, + "it": 0.0026052820030599833, + "id": 0.0002559504355303943, + "hi": 0.00036094794631935656, + "fi": 5.62248460482806e-05, + "vi": 0.0011927851010113955, + "he": 0.0003260892990510911, + "uk": 0.0017354920273646712, + "el": 0.00019095065363217145, + "ms": 0.0005904714344069362, + "cs": 0.0007178307278081775, + "ro": 0.0009003614541143179, + "da": 0.0001010177584248595, + "hu": 8.880029781721532e-05, + "ta": 7.943290256662294e-06, + "no": 0.000378270196961239, + "th": 
5.119330307934433e-05, + "ur": 0.00023213693930301815, + "hr": 0.0004253006190992892, + "bg": 0.0004319981671869755, + "lt": 0.0001386153162457049, + "la": 0.0008864026167429984, + "mi": 5.62248460482806e-05, + "ml": 3.6652261314884527e-06, + "cy": 0.0005050569889135659, + "sk": 0.0006384518346749246, + "te": 1.9506836906657554e-05, + "fa": 0.00011627071216935292, + "lv": 2.100969140883535e-05, + "bn": 3.5322318581165746e-05, + "sr": 0.00010141311940969899, + "az": 3.2924017432378605e-05, + "sl": 0.0004972267779521644, + "kn": 1.1376539532648167e-06, + "et": 3.886401827912778e-06, + "mk": 4.178275776212104e-05, + "br": 0.001669006422162056, + "eu": 5.513735595741309e-05, + "is": 9.506873539066873e-06, + "hy": 4.2434403439983726e-06, + "ne": 3.3047945180442184e-06, + "mn": 3.559935430530459e-05, + "bs": 0.0002661463222466409, + "kk": 1.3045214473095257e-05, + "sq": 0.00017049974121619016, + "sw": 3.068856312893331e-05, + "gl": 0.00019395769049879164, + "mr": 2.1512002490453597e-07, + "pa": 2.8322670004854444e-06, + "si": 2.838228283508215e-05, + "km": 0.00015223913942463696, + "sn": 0.00028110656421631575, + "yo": 0.0003637789050117135, + "so": 8.307013672492758e-07, + "af": 2.2277508833212778e-05, + "oc": 0.0004253006190992892, + "ka": 1.5580286572003388e-06, + "be": 0.00017318472964689136, + "tg": 2.0718216831028258e-07, + "sd": 3.5322318581165746e-05, + "gu": 8.50400795116002e-07, + "am": 2.665870624696254e-06, + "yi": 2.8604887120309286e-05, + "lo": 1.2943694855493959e-05, + "uz": 1.491831658206877e-09, + "fo": 5.892313129152171e-05, + "ht": 0.00017938153177965432, + "ps": 9.036155461217277e-06, + "tk": 1.281216821524822e-08, + "nn": 0.0024094919208437204, + "mt": 8.099957085505594e-06, + "sa": 5.600564327323809e-05, + "lb": 6.14076256510998e-08, + "my": 3.849208223982714e-05, + "bo": 9.126193617703393e-05, + "tl": 6.483123797806911e-06, + "mg": 1.4993576158417454e-08, + "as": 2.3480320123780984e-06, + "tt": 1.376765368377164e-07, + "haw": 0.0002519823028706014, 
+ "ln": 2.1592100893030874e-05, + "ha": 7.02048819078982e-09, + "ba": 1.902783886009729e-08, + "jw": 0.0002855333441402763, + "su": 9.264376821249698e-09 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/bonjour_vous_allez_bien.mp3.words.json b/tests/expected/tiny_auto/bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba2f58d60ffd0cfbf7a7dd0c3fc0e4187d7ddeb --- /dev/null +++ b/tests/expected/tiny_auto/bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,255 @@ +{ + "text": " Боже улыл! Эскому зарегиан! Боже улыл! Эскому зарегиан!", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.44, + "end": 1.88, + "text": " Боже улыл!", + "tokens": [ + 50364, + 5697, + 9292, + 1595, + 30975, + 693, + 0, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.9443809107730263, + "compression_ratio": 0.8166666666666667, + "no_speech_prob": 0.04302893579006195, + "confidence": 0.317, + "words": [ + { + "text": "Боже", + "start": 0.44, + "end": 0.86, + "confidence": 0.423 + }, + { + "text": "улыл!", + "start": 0.86, + "end": 1.88, + "confidence": 0.261 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.88, + "end": 3.14, + "text": " Эскому зарегиан!", + "tokens": [ + 50464, + 5381, + 4218, + 4161, + 17821, + 4953, + 435, + 1416, + 0, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.9443809107730263, + "compression_ratio": 0.8166666666666667, + "no_speech_prob": 0.04302893579006195, + "confidence": 0.395, + "words": [ + { + "text": "Эскому", + "start": 1.88, + "end": 2.3, + "confidence": 0.286 + }, + { + "text": "зарегиан!", + "start": 2.3, + "end": 3.14, + "confidence": 0.505 + } + ] + }, + { + "id": 2, + "seek": 3000, + "start": 32.98, + "end": 34.02, + "text": " Боже улыл!", + "tokens": [ + 50364, + 5697, + 9292, + 1595, + 30975, + 693, + 0, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.3071819355613307, + "compression_ratio": 0.8166666666666667, + "no_speech_prob": 
0.2232234627008438, + "confidence": 0.577, + "words": [ + { + "text": "Боже", + "start": 32.98, + "end": 33.36, + "confidence": 0.446 + }, + { + "text": "улыл!", + "start": 33.36, + "end": 34.02, + "confidence": 0.686 + } + ] + }, + { + "id": 3, + "seek": 3000, + "start": 34.42, + "end": 35.72, + "text": " Эскому зарегиан!", + "tokens": [ + 50564, + 5381, + 4218, + 4161, + 17821, + 4953, + 435, + 1416, + 0, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.3071819355613307, + "compression_ratio": 0.8166666666666667, + "no_speech_prob": 0.2232234627008438, + "confidence": 0.849, + "words": [ + { + "text": "Эскому", + "start": 34.42, + "end": 34.84, + "confidence": 0.691 + }, + { + "text": "зарегиан!", + "start": 34.84, + "end": 35.72, + "confidence": 0.992 + } + ] + } + ], + "language": "ru", + "language_probs": { + "en": 0.05109040066599846, + "zh": 0.0006792841013520956, + "de": 0.0007287654443643987, + "es": 0.01429856475442648, + "ru": 0.5119792819023132, + "ko": 0.0008257994195446372, + "fr": 0.021297650411725044, + "ja": 0.001567091909237206, + "pt": 0.2036512941122055, + "tr": 0.0052192131988704205, + "pl": 0.10648154467344284, + "ca": 0.00012226558465044945, + "nl": 0.008672517724335194, + "ar": 0.0009284712723456323, + "sv": 0.0007879833574406803, + "it": 0.0003537872398737818, + "id": 0.00035935858613811433, + "hi": 3.0913583032088354e-05, + "fi": 7.021122291916981e-05, + "vi": 3.714352715178393e-05, + "he": 0.00010457931057317182, + "uk": 0.00486484169960022, + "el": 0.00486484169960022, + "ms": 0.0002489204052835703, + "cs": 0.0018037117552012205, + "ro": 0.0008388038841076195, + "da": 1.0725262654887047e-05, + "hu": 0.0007637396920472383, + "ta": 3.6562209970725235e-06, + "no": 0.0001316852285526693, + "th": 1.203341184918827e-06, + "ur": 0.00010581205424387008, + "hr": 0.0008453827467747033, + "bg": 0.007534814067184925, + "lt": 0.00010581205424387008, + "la": 0.002408271422609687, + "mi": 6.268220658967039e-06, + "ml": 4.929601345793344e-06, + 
"cy": 0.000450736639322713, + "sk": 0.0019200412789359689, + "te": 1.409809283359209e-05, + "fa": 6.318325904430822e-05, + "lv": 9.672004671301693e-05, + "bn": 2.209294143540319e-05, + "sr": 0.00021542265312746167, + "az": 5.341388168744743e-05, + "sl": 0.0004969748551957309, + "kn": 5.667552613886073e-07, + "et": 3.4956110539496876e-06, + "mk": 0.0002403213584329933, + "br": 0.0026866206899285316, + "eu": 4.677075776271522e-05, + "is": 5.4680560424458236e-05, + "hy": 4.1673874875414185e-06, + "ne": 1.0363322644479922e-06, + "mn": 9.958069313142914e-06, + "bs": 0.00044374860590323806, + "kk": 1.220088051923085e-05, + "sq": 0.00021881508291698992, + "sw": 1.3558002137870062e-05, + "gl": 0.0006635484169237316, + "mr": 8.262362030109216e-07, + "pa": 1.8348761159359128e-06, + "si": 0.00010457931057317182, + "km": 0.00046869192738085985, + "sn": 0.00016134412726387382, + "yo": 0.00029444784740917385, + "so": 4.1667655636956624e-07, + "af": 1.9119846911053173e-05, + "oc": 0.0002670526155270636, + "ka": 6.517918791359989e-06, + "be": 0.00028762698639184237, + "tg": 3.018845688984584e-07, + "sd": 1.2836458154197317e-05, + "gu": 2.184769272162157e-07, + "am": 1.0373449867984164e-06, + "yi": 0.00014072682824917138, + "lo": 9.43591373925301e-07, + "uz": 1.9715000743047995e-09, + "fo": 8.352842087333556e-06, + "ht": 4.658841862692498e-05, + "ps": 3.831686626654118e-06, + "tk": 1.198291865733836e-08, + "nn": 0.03350590169429779, + "mt": 1.2393017641443294e-05, + "sa": 6.752147601218894e-05, + "lb": 8.849924171272505e-08, + "my": 2.0073605355719337e-06, + "bo": 4.703858849097742e-06, + "tl": 7.429171546391444e-06, + "mg": 8.09222822084621e-09, + "as": 1.8674148805075674e-06, + "tt": 9.030228511619498e-07, + "haw": 0.0020279677119106054, + "ln": 7.2146781349147204e-06, + "ha": 3.7193925717105003e-09, + "ba": 1.6799896584984708e-08, + "jw": 0.0009730295278131962, + "su": 1.2147872929801906e-08 + } +} \ No newline at end of file diff --git 
a/tests/expected/tiny_auto/empty.mp3.words.json b/tests/expected/tiny_auto/empty.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..44c624e28480469c66fd29b1192e68a3a82f1904 --- /dev/null +++ b/tests/expected/tiny_auto/empty.mp3.words.json @@ -0,0 +1,106 @@ +{ + "text": "", + "segments": [], + "language": "en", + "language_probs": { + "en": 0.481865257024765, + "zh": 0.018109099939465523, + "de": 0.013043494895100594, + "es": 0.011969382874667645, + "ru": 0.01839427463710308, + "ko": 0.05078822001814842, + "fr": 0.019888954237103462, + "ja": 0.06370270252227783, + "pt": 0.009542823769152164, + "tr": 0.002145992126315832, + "pl": 0.01648852229118347, + "ca": 0.00040956982411444187, + "nl": 0.008226429112255573, + "ar": 0.001984718255698681, + "sv": 0.0016844086349010468, + "it": 0.0077886260114610195, + "id": 0.0019387423526495695, + "hi": 0.0013964237878099084, + "fi": 0.0012615637388080359, + "vi": 0.0008145267493091524, + "he": 0.000482591160107404, + "uk": 0.000624519307166338, + "el": 0.0008145267493091524, + "ms": 0.002820853376761079, + "cs": 0.0010377340950071812, + "ro": 0.0007533141179010272, + "da": 0.00025036497390829027, + "hu": 0.0009672744781710207, + "ta": 0.00022094632731750607, + "no": 0.00029270630329847336, + "th": 0.0009748608572408557, + "ur": 0.0001483363303123042, + "hr": 0.00012887685443274677, + "bg": 0.0003877728886436671, + "lt": 2.365429827477783e-05, + "la": 0.015856856480240822, + "mi": 0.0006443436723202467, + "ml": 0.0004979101940989494, + "cy": 0.00882566999644041, + "sk": 0.00016940542263910174, + "te": 0.00014603660383727401, + "fa": 0.0002665121282916516, + "lv": 3.233158713555895e-05, + "bn": 0.0007711784564889967, + "sr": 4.023731162305921e-05, + "az": 2.9209157219156623e-05, + "sl": 0.00010274958185618743, + "kn": 1.463002718082862e-05, + "et": 2.9901832022005692e-05, + "mk": 1.9996876289951615e-05, + "br": 0.0027127882931381464, + "eu": 0.00014718198508489877, + "is": 4.087095658178441e-05, + 
"hy": 4.023731162305921e-05, + "ne": 3.414896491449326e-05, + "mn": 0.00015667440311517566, + "bs": 8.720243931747973e-05, + "kk": 1.0293509149050806e-05, + "sq": 3.037271926586982e-05, + "sw": 6.92527974024415e-05, + "gl": 0.000482591160107404, + "mr": 4.471296415431425e-05, + "pa": 1.7716249203658663e-05, + "si": 0.0001483363303123042, + "km": 0.0005912830238230526, + "sn": 0.00034489232348278165, + "yo": 0.00016677902021910995, + "so": 2.9491400255210465e-06, + "af": 6.111538095865399e-05, + "oc": 0.00018898540292866528, + "ka": 2.6182920919382013e-05, + "be": 6.0167876654304564e-05, + "tg": 1.8398510803763202e-07, + "sd": 3.1092986318981275e-05, + "gu": 1.0333797035855241e-05, + "am": 5.155722647032235e-06, + "yi": 8.25616079964675e-05, + "lo": 1.0914664926531259e-05, + "uz": 2.2382069531090565e-09, + "fo": 0.00017207316705025733, + "ht": 7.089507562341169e-05, + "ps": 1.2128717571613379e-05, + "tk": 1.972132324112863e-08, + "nn": 0.21719369292259216, + "mt": 1.3320791367732454e-05, + "sa": 0.0002484166470821947, + "lb": 1.790224075648439e-07, + "my": 0.00010274958185618743, + "bo": 4.4887969124829397e-05, + "tl": 0.0003642789088189602, + "mg": 2.4045375468517705e-08, + "as": 1.7441585441702046e-05, + "tt": 9.323910887815146e-08, + "haw": 0.0036504557356238365, + "ln": 6.170591859699925e-06, + "ha": 2.120961006824018e-08, + "ba": 1.7063216617430044e-08, + "jw": 0.003679086221382022, + "su": 3.741536147572333e-08 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/gaenswein15.mp3.words.json b/tests/expected/tiny_auto/gaenswein15.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..bf47cbea2c554abe6c88811b63d56b929eca013b --- /dev/null +++ b/tests/expected/tiny_auto/gaenswein15.mp3.words.json @@ -0,0 +1,438 @@ +{ + "text": " Wie wieder zu dazu ist Meshfuchs von 1962 als Meshale für die außerordentliche Form des grullischen Rätus ist dann nicht so weitergegangen wie sich Papstbälle dick das gewünscht hatte. 
Das hat er als Meshale im Rätus", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.92, + "end": 8.04, + "text": " Wie wieder zu dazu ist Meshfuchs von 1962 als Meshale für die außerordentliche Form des grullischen", + "tokens": [ + 50364, + 9233, + 6216, + 2164, + 13034, + 1418, + 376, + 14935, + 69, + 37503, + 2957, + 39498, + 3907, + 376, + 14935, + 1220, + 2959, + 978, + 39428, + 765, + 7698, + 68, + 10126, + 730, + 677, + 858, + 6282, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.6858572118422565, + "compression_ratio": 1.3293413173652695, + "no_speech_prob": 0.04553895816206932, + "confidence": 0.503, + "words": [ + { + "text": "Wie", + "start": 0.92, + "end": 1.1, + "confidence": 0.459 + }, + { + "text": "wieder", + "start": 1.1, + "end": 1.4, + "confidence": 0.891 + }, + { + "text": "zu", + "start": 1.4, + "end": 1.6, + "confidence": 0.283 + }, + { + "text": "dazu", + "start": 1.6, + "end": 1.92, + "confidence": 0.173 + }, + { + "text": "ist", + "start": 1.92, + "end": 2.14, + "confidence": 0.649 + }, + { + "text": "Meshfuchs", + "start": 2.14, + "end": 2.74, + "confidence": 0.333 + }, + { + "text": "von", + "start": 2.74, + "end": 3.22, + "confidence": 0.626 + }, + { + "text": "1962", + "start": 3.22, + "end": 4.84, + "confidence": 0.182 + }, + { + "text": "als", + "start": 4.84, + "end": 5.24, + "confidence": 0.883 + }, + { + "text": "Meshale", + "start": 5.24, + "end": 5.78, + "confidence": 0.389 + }, + { + "text": "für", + "start": 5.78, + "end": 5.92, + "confidence": 0.935 + }, + { + "text": "die", + "start": 5.92, + "end": 6.08, + "confidence": 0.973 + }, + { + "text": "außerordentliche", + "start": 6.08, + "end": 7.04, + "confidence": 0.898 + }, + { + "text": "Form", + "start": 7.04, + "end": 7.4, + "confidence": 0.64 + }, + { + "text": "des", + "start": 7.4, + "end": 7.62, + "confidence": 0.974 + }, + { + "text": "grullischen", + "start": 7.62, + "end": 8.04, + "confidence": 0.371 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 
9.42, + "end": 12.78, + "text": " Rätus ist dann nicht so weitergegangen wie sich Papstbälle dick das gewünscht hatte.", + "tokens": [ + 50764, + 497, + 3628, + 301, + 1418, + 3594, + 1979, + 370, + 8988, + 432, + 47152, + 3355, + 3041, + 15919, + 372, + 65, + 31447, + 18659, + 1482, + 6906, + 3412, + 82, + 4701, + 13299, + 13, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.6858572118422565, + "compression_ratio": 1.3293413173652695, + "no_speech_prob": 0.04553895816206932, + "confidence": 0.63, + "words": [ + { + "text": "Rätus", + "start": 9.42, + "end": 9.44, + "confidence": 0.381 + }, + { + "text": "ist", + "start": 9.44, + "end": 9.62, + "confidence": 0.897 + }, + { + "text": "dann", + "start": 9.62, + "end": 9.78, + "confidence": 0.586 + }, + { + "text": "nicht", + "start": 9.78, + "end": 9.96, + "confidence": 0.979 + }, + { + "text": "so", + "start": 9.96, + "end": 10.12, + "confidence": 0.991 + }, + { + "text": "weitergegangen", + "start": 10.12, + "end": 10.88, + "confidence": 0.703 + }, + { + "text": "wie", + "start": 10.88, + "end": 11.04, + "confidence": 0.77 + }, + { + "text": "sich", + "start": 11.04, + "end": 11.24, + "confidence": 0.968 + }, + { + "text": "Papstbälle", + "start": 11.24, + "end": 11.72, + "confidence": 0.453 + }, + { + "text": "dick", + "start": 11.72, + "end": 11.9, + "confidence": 0.249 + }, + { + "text": "das", + "start": 11.9, + "end": 12.08, + "confidence": 0.833 + }, + { + "text": "gewünscht", + "start": 12.08, + "end": 12.58, + "confidence": 0.801 + }, + { + "text": "hatte.", + "start": 12.58, + "end": 12.78, + "confidence": 0.906 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 14.0, + "end": 15.28, + "text": " Das hat er als Meshale im Rätus", + "tokens": [ + 51014, + 2846, + 2385, + 1189, + 3907, + 376, + 14935, + 1220, + 566, + 497, + 3628, + 301, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.6858572118422565, + "compression_ratio": 1.3293413173652695, + "no_speech_prob": 0.04553895816206932, + 
"confidence": 0.409, + "words": [ + { + "text": "Das", + "start": 14.0, + "end": 14.2, + "confidence": 0.938 + }, + { + "text": "hat", + "start": 14.2, + "end": 14.4, + "confidence": 0.955 + }, + { + "text": "er", + "start": 14.4, + "end": 14.56, + "confidence": 0.736 + }, + { + "text": "als", + "start": 14.56, + "end": 14.7, + "confidence": 0.83 + }, + { + "text": "Meshale", + "start": 14.7, + "end": 15.1, + "confidence": 0.188 + }, + { + "text": "im", + "start": 15.1, + "end": 15.12, + "confidence": 0.05 + }, + { + "text": "Rätus", + "start": 15.12, + "end": 15.28, + "confidence": 0.665 + } + ] + } + ], + "language": "de", + "language_probs": { + "en": 0.003979361150413752, + "zh": 0.0001519044308224693, + "de": 0.9890514016151428, + "es": 0.00012993074778933078, + "ru": 0.00024085355107672513, + "ko": 5.632081229123287e-05, + "fr": 0.00034500681795179844, + "ja": 4.632823765859939e-05, + "pt": 0.0002543920709285885, + "tr": 0.0002227531367680058, + "pl": 0.00029741442995145917, + "ca": 6.455285301854019e-07, + "nl": 0.00042602652683854103, + "ar": 0.00012993074778933078, + "sv": 0.0003266458516009152, + "it": 0.0001239807897945866, + "id": 5.086642431706423e-07, + "hi": 3.259598452132195e-05, + "fi": 2.2755664758733474e-05, + "vi": 3.600468971853843e-06, + "he": 5.632081229123287e-05, + "uk": 7.864147846703418e-06, + "el": 5.798658548883395e-06, + "ms": 3.1037982353154803e-06, + "cs": 5.664333002641797e-06, + "ro": 9.48597244132543e-06, + "da": 0.00040021486347541213, + "hu": 3.0861257982905954e-05, + "ta": 3.001986499384657e-07, + "no": 6.042340464773588e-05, + "th": 4.016613729618257e-06, + "ur": 3.993743666796945e-05, + "hr": 2.361245378779131e-06, + "bg": 2.149938154616393e-06, + "lt": 4.0872319573281857e-07, + "la": 0.001671855105087161, + "mi": 1.2469075045373756e-05, + "ml": 6.898509923303209e-07, + "cy": 0.00010941266373265535, + "sk": 8.720533628547855e-07, + "te": 4.853707764596038e-07, + "fa": 1.208544199471362e-05, + "lv": 1.674373606874724e-06, + 
"bn": 2.893058081099298e-06, + "sr": 1.9575409169192426e-06, + "az": 5.077475179859903e-06, + "sl": 1.5277430065907538e-05, + "kn": 9.483140672728041e-08, + "et": 2.3246375349117443e-06, + "mk": 2.1370587433011679e-07, + "br": 9.358560782857239e-05, + "eu": 7.049376108625438e-06, + "is": 6.319019576039864e-06, + "hy": 1.0418302736070473e-05, + "ne": 6.660197868768591e-07, + "mn": 4.921257186651928e-06, + "bs": 3.0796443297731457e-06, + "kk": 5.166745040696696e-07, + "sq": 1.8246288391310372e-06, + "sw": 1.111024857891607e-06, + "gl": 4.998756139684701e-06, + "mr": 3.495994747026998e-07, + "pa": 3.07317634451465e-07, + "si": 1.1898074262717273e-05, + "km": 4.5967710320837796e-05, + "sn": 3.469824878266081e-05, + "yo": 5.7087581808445975e-06, + "so": 7.356683795478602e-08, + "af": 1.3169968042348046e-05, + "oc": 1.4019357877259608e-05, + "ka": 1.5546031590929488e-06, + "be": 1.0097765880345833e-05, + "tg": 1.7748824632235483e-08, + "sd": 2.634159272929537e-06, + "gu": 8.111359761642234e-08, + "am": 2.7226835186411336e-07, + "yi": 0.0002860206877812743, + "lo": 2.0471769346386282e-07, + "uz": 3.1354466245581136e-10, + "fo": 1.7861124433693476e-05, + "ht": 8.113782314467244e-06, + "ps": 4.5596365794153826e-07, + "tk": 1.6308678851828518e-09, + "nn": 0.0009751844918355346, + "mt": 1.0477962177901645e-06, + "sa": 6.368580670823576e-06, + "lb": 8.4853121506967e-07, + "my": 1.5185909205683856e-06, + "bo": 1.5852650676606572e-06, + "tl": 6.556940661539556e-07, + "mg": 1.8946131330466187e-09, + "as": 5.553116366741051e-08, + "tt": 4.195181535493475e-09, + "haw": 5.676254295394756e-05, + "ln": 4.454012980659172e-07, + "ha": 2.018775591139388e-09, + "ba": 9.71490776713324e-10, + "jw": 5.9023703215643764e-05, + "su": 8.410887541998591e-10 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/gloria.mp3.words.json b/tests/expected/tiny_auto/gloria.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..4c527d14675e524f00c5e964423d5067a1ce477b --- /dev/null +++ b/tests/expected/tiny_auto/gloria.mp3.words.json @@ -0,0 +1,677 @@ +{ + "text": " Hello. You're my girlfriend. How are you? I'm okay. Why will be? I said she could stay with us, but she feels better. Oh, she can. There's more to be for long. What if you can stay as long as you want? My girlfriend. Really, mixture. I agree.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 1.34, + "end": 1.78, + "text": " Hello.", + "tokens": [ + 50364, + 2425, + 13, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.407, + "words": [ + { + "text": "Hello.", + "start": 1.34, + "end": 1.78, + "confidence": 0.407 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.96, + "end": 4.26, + "text": " You're my girlfriend.", + "tokens": [ + 50464, + 509, + 434, + 452, + 10369, + 13, + 50614 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.175, + "words": [ + { + "text": "You're", + "start": 1.96, + "end": 3.12, + "confidence": 0.192 + }, + { + "text": "my", + "start": 3.12, + "end": 3.2, + "confidence": 0.206 + }, + { + "text": "girlfriend.", + "start": 3.2, + "end": 4.26, + "confidence": 0.123 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 5.52, + "end": 6.54, + "text": " How are you?", + "tokens": [ + 50614, + 1012, + 366, + 291, + 30, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.627, + "words": [ + { + "text": "How", + "start": 5.52, + "end": 5.8, + "confidence": 0.49 + }, + { + "text": "are", + "start": 5.8, + "end": 6.16, + "confidence": 0.524 + }, + { + "text": "you?", + "start": 6.16, + "end": 6.54, + 
"confidence": 0.959 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 6.76, + "end": 7.8, + "text": " I'm okay.", + "tokens": [ + 50714, + 286, + 478, + 1392, + 13, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.836, + "words": [ + { + "text": "I'm", + "start": 6.76, + "end": 7.1, + "confidence": 0.838 + }, + { + "text": "okay.", + "start": 7.1, + "end": 7.8, + "confidence": 0.83 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 8.38, + "end": 9.14, + "text": " Why will be?", + "tokens": [ + 50764, + 1545, + 486, + 312, + 30, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.382, + "words": [ + { + "text": "Why", + "start": 8.38, + "end": 8.66, + "confidence": 0.343 + }, + { + "text": "will", + "start": 8.66, + "end": 8.96, + "confidence": 0.523 + }, + { + "text": "be?", + "start": 8.96, + "end": 9.14, + "confidence": 0.311 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 9.4, + "end": 11.52, + "text": " I said she could stay with us, but she feels better.", + "tokens": [ + 50814, + 286, + 848, + 750, + 727, + 1754, + 365, + 505, + 11, + 457, + 750, + 3417, + 1101, + 13, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.692, + "words": [ + { + "text": "I", + "start": 9.4, + "end": 9.52, + "confidence": 0.285 + }, + { + "text": "said", + "start": 9.52, + "end": 9.66, + "confidence": 0.621 + }, + { + "text": "she", + "start": 9.66, + "end": 9.82, + "confidence": 0.849 + }, + { + "text": "could", + "start": 9.82, + "end": 9.98, + "confidence": 0.912 + }, + { + "text": "stay", + "start": 9.98, + "end": 10.14, + "confidence": 0.992 + }, + { + "text": "with", + "start": 10.14, + "end": 10.26, 
+ "confidence": 0.986 + }, + { + "text": "us,", + "start": 10.26, + "end": 10.44, + "confidence": 0.782 + }, + { + "text": "but", + "start": 10.64, + "end": 10.72, + "confidence": 0.227 + }, + { + "text": "she", + "start": 10.72, + "end": 10.94, + "confidence": 0.971 + }, + { + "text": "feels", + "start": 10.94, + "end": 11.24, + "confidence": 0.762 + }, + { + "text": "better.", + "start": 11.24, + "end": 11.52, + "confidence": 0.987 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 12.18, + "end": 13.44, + "text": " Oh, she can.", + "tokens": [ + 50964, + 876, + 11, + 750, + 393, + 13, + 51064 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.287, + "words": [ + { + "text": "Oh,", + "start": 12.18, + "end": 12.6, + "confidence": 0.181 + }, + { + "text": "she", + "start": 12.8, + "end": 12.96, + "confidence": 0.686 + }, + { + "text": "can.", + "start": 12.96, + "end": 13.44, + "confidence": 0.191 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 13.5, + "end": 15.2, + "text": " There's more to be for long.", + "tokens": [ + 51064, + 821, + 311, + 544, + 281, + 312, + 337, + 938, + 13, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.682, + "words": [ + { + "text": "There's", + "start": 13.5, + "end": 14.44, + "confidence": 0.518 + }, + { + "text": "more", + "start": 14.44, + "end": 14.56, + "confidence": 0.814 + }, + { + "text": "to", + "start": 14.56, + "end": 14.74, + "confidence": 0.414 + }, + { + "text": "be", + "start": 14.74, + "end": 14.8, + "confidence": 0.949 + }, + { + "text": "for", + "start": 14.8, + "end": 15.0, + "confidence": 0.987 + }, + { + "text": "long.", + "start": 15.0, + "end": 15.2, + "confidence": 0.814 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 15.38, + "end": 16.86, + "text": " What if 
you can stay as long as you want?", + "tokens": [ + 51114, + 708, + 498, + 291, + 393, + 1754, + 382, + 938, + 382, + 291, + 528, + 30, + 51214 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.771, + "words": [ + { + "text": "What", + "start": 15.38, + "end": 15.54, + "confidence": 0.387 + }, + { + "text": "if", + "start": 15.54, + "end": 15.62, + "confidence": 0.918 + }, + { + "text": "you", + "start": 15.62, + "end": 15.7, + "confidence": 0.97 + }, + { + "text": "can", + "start": 15.7, + "end": 15.98, + "confidence": 0.946 + }, + { + "text": "stay", + "start": 15.98, + "end": 16.12, + "confidence": 0.958 + }, + { + "text": "as", + "start": 16.12, + "end": 16.24, + "confidence": 0.308 + }, + { + "text": "long", + "start": 16.24, + "end": 16.36, + "confidence": 0.993 + }, + { + "text": "as", + "start": 16.36, + "end": 16.54, + "confidence": 0.992 + }, + { + "text": "you", + "start": 16.54, + "end": 16.62, + "confidence": 0.959 + }, + { + "text": "want?", + "start": 16.62, + "end": 16.86, + "confidence": 0.82 + } + ] + }, + { + "id": 9, + "seek": 0, + "start": 16.86, + "end": 17.74, + "text": " My girlfriend.", + "tokens": [ + 51214, + 1222, + 10369, + 13, + 51264 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.141, + "words": [ + { + "text": "My", + "start": 16.86, + "end": 17.34, + "confidence": 0.125 + }, + { + "text": "girlfriend.", + "start": 17.34, + "end": 17.74, + "confidence": 0.159 + } + ] + }, + { + "id": 10, + "seek": 0, + "start": 17.98, + "end": 18.9, + "text": " Really, mixture.", + "tokens": [ + 51264, + 4083, + 11, + 9925, + 13, + 51314 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.439, + "words": 
[ + { + "text": "Really,", + "start": 17.98, + "end": 18.34, + "confidence": 0.704 + }, + { + "text": "mixture.", + "start": 18.7, + "end": 18.9, + "confidence": 0.273 + } + ] + }, + { + "id": 11, + "seek": 0, + "start": 19.72, + "end": 20.22, + "text": " I agree.", + "tokens": [ + 51314, + 286, + 3986, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.5507037403819325, + "compression_ratio": 1.4319526627218935, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.16, + "words": [ + { + "text": "I", + "start": 19.72, + "end": 20.06, + "confidence": 0.098 + }, + { + "text": "agree.", + "start": 20.06, + "end": 20.22, + "confidence": 0.259 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.8432613015174866, + "zh": 0.0022250444162636995, + "de": 0.003997680731117725, + "es": 0.005014214664697647, + "ru": 0.006747363600879908, + "ko": 0.00396657083183527, + "fr": 0.004710419103503227, + "ja": 0.0019181080861017108, + "pt": 0.0026839158963412046, + "tr": 0.001666481141000986, + "pl": 0.0017193809617310762, + "ca": 0.0010107719572260976, + "nl": 0.005379467271268368, + "ar": 0.002295674756169319, + "sv": 0.003212226554751396, + "it": 0.001200321363285184, + "id": 0.00030586906359530985, + "hi": 0.0005284943035803735, + "fi": 0.0010428574169054627, + "vi": 0.0002763296652119607, + "he": 0.00021689364803023636, + "uk": 0.0008713398710824549, + "el": 0.0014365967363119125, + "ms": 0.0031133966986089945, + "cs": 0.0003689485020004213, + "ro": 0.00020375273015815765, + "da": 0.0017464574193581939, + "hu": 0.0004180734104011208, + "ta": 0.0002575675898697227, + "no": 0.000508248049300164, + "th": 0.0001611816551303491, + "ur": 0.0008185480255633593, + "hr": 7.886112871346995e-05, + "bg": 8.232354593928903e-05, + "lt": 0.0001188479145639576, + "la": 0.00432252325117588, + "mi": 0.0036972500383853912, + "ml": 0.0003281495883129537, + "cy": 0.06814596056938171, + "sk": 4.4933716708328575e-05, + "te": 0.0001057055196724832, + "fa": 
9.219799540005624e-05, + "lv": 0.00012651293945964426, + "bn": 0.0001188479145639576, + "sr": 4.6541510528186336e-05, + "az": 2.8118798581999727e-05, + "sl": 0.000240079389186576, + "kn": 7.249770078487927e-06, + "et": 0.00010488291445653886, + "mk": 2.29498964472441e-05, + "br": 0.0006526034558191895, + "eu": 4.475853347685188e-05, + "is": 0.0007570332381874323, + "hy": 1.1405487384763546e-05, + "ne": 8.866594725986943e-05, + "mn": 4.2876046791207045e-05, + "bs": 0.0001756458223098889, + "kk": 1.1316729796817526e-05, + "sq": 4.9737089284462854e-05, + "sw": 0.0003011270018760115, + "gl": 0.0005538573605008423, + "mr": 1.3650581422552932e-05, + "pa": 8.643010005471297e-06, + "si": 3.431755612837151e-05, + "km": 0.0001798111479729414, + "sn": 0.0002595876867417246, + "yo": 0.00017157700494863093, + "so": 2.795035015878966e-06, + "af": 0.000512234284542501, + "oc": 7.437312160618603e-05, + "ka": 7.931271284178365e-06, + "be": 9.112384577747434e-05, + "tg": 3.491570339519967e-07, + "sd": 6.386368477251381e-05, + "gu": 3.547084133970202e-06, + "am": 8.247217010648455e-06, + "yi": 0.0001245515450136736, + "lo": 3.1302906791097485e-06, + "uz": 2.5990114504992334e-09, + "fo": 0.00025357434060424566, + "ht": 0.0002135310205630958, + "ps": 1.2773540220223367e-05, + "tk": 4.470028258651837e-08, + "nn": 0.00795033760368824, + "mt": 4.2376526835141703e-05, + "sa": 0.00010488291445653886, + "lb": 5.612301947621745e-07, + "my": 2.5904251742758788e-05, + "bo": 5.570289431489073e-05, + "tl": 0.0005582012236118317, + "mg": 8.244755633768364e-08, + "as": 4.501483999774791e-06, + "tt": 7.206338068499463e-07, + "haw": 0.004565494600683451, + "ln": 9.909259460982867e-06, + "ha": 1.484210372382222e-07, + "ba": 4.651499807550863e-08, + "jw": 0.0009569796384312212, + "su": 8.875615975512119e-08 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/japanese.mp3.words.json b/tests/expected/tiny_auto/japanese.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..aef90205227e57c0ebaaad94ef18635489395ab4 --- /dev/null +++ b/tests/expected/tiny_auto/japanese.mp3.words.json @@ -0,0 +1,1619 @@ +{ + "text": "いきます 入室タブでの最図免証記が実際と違う県に関するご質問いただいております同じ度面でデレクトリーごとに 別再度として管理上をしている際と針ます サプテレクトリーごとにわけたサイトはそれぞれ パブリシャーセンターに登録していくグルニュース上では 別再度として認識され パンコン愛行は最図ごと物物は正しく表示されますしかし グルニュースタブでは バブコン最図免証記ともに正しくない以上 時にいいなります こちらいたしても ではありませんパブコンはサプテレクトリーごとに 設定した", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.08, + "end": 6.62, + "text": "いきます 入室タブでの最図免証記が実際と違う県に関するご質問いただいております", + "tokens": [ + 50364, + 47348, + 220, + 14028, + 2415, + 97, + 12144, + 28889, + 2474, + 2972, + 8661, + 3919, + 111, + 2347, + 235, + 5396, + 120, + 16958, + 5142, + 33197, + 34837, + 3193, + 49806, + 2862, + 234, + 4108, + 5196, + 95, + 22570, + 9991, + 43450, + 11361, + 32418, + 18549, + 6117, + 19420, + 50712 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.551, + "words": [ + { + "text": "いきます", + "start": 0.08, + "end": 0.6, + "confidence": 0.153 + }, + { + "text": " ", + "start": 0.6, + "end": 1.18, + "confidence": 0.305 + }, + { + "text": "入", + "start": 1.18, + "end": 1.38, + "confidence": 0.435 + }, + { + "text": "室", + "start": 1.38, + "end": 1.52, + "confidence": 0.501 + }, + { + "text": "タ", + "start": 1.52, + "end": 1.68, + "confidence": 0.201 + }, + { + "text": "ブ", + "start": 1.68, + "end": 1.78, + "confidence": 0.837 + }, + { + "text": "で", + "start": 1.78, + "end": 1.98, + "confidence": 0.947 + }, + { + "text": "の", + "start": 1.98, + "end": 2.22, + "confidence": 0.907 + }, + { + "text": "最", + "start": 2.22, + "end": 2.64, + "confidence": 0.277 + }, + { + "text": "図", + "start": 2.64, + "end": 2.78, + "confidence": 0.349 + }, + { + "text": "免", + "start": 2.78, + "end": 2.98, + "confidence": 0.647 + }, + { + "text": "証", + "start": 2.98, + "end": 3.18, + "confidence": 0.282 + }, + { + 
"text": "記", + "start": 3.18, + "end": 3.32, + "confidence": 0.299 + }, + { + "text": "が", + "start": 3.32, + "end": 3.5, + "confidence": 0.976 + }, + { + "text": "実", + "start": 3.5, + "end": 3.74, + "confidence": 0.343 + }, + { + "text": "際", + "start": 3.74, + "end": 3.9, + "confidence": 0.975 + }, + { + "text": "と", + "start": 3.9, + "end": 4.08, + "confidence": 0.91 + }, + { + "text": "違う", + "start": 4.08, + "end": 4.38, + "confidence": 0.803 + }, + { + "text": "県", + "start": 4.38, + "end": 4.6, + "confidence": 0.405 + }, + { + "text": "に", + "start": 4.6, + "end": 4.74, + "confidence": 0.988 + }, + { + "text": "関", + "start": 4.74, + "end": 4.94, + "confidence": 0.543 + }, + { + "text": "する", + "start": 4.94, + "end": 5.12, + "confidence": 0.947 + }, + { + "text": "ご", + "start": 5.12, + "end": 5.3, + "confidence": 0.499 + }, + { + "text": "質", + "start": 5.3, + "end": 5.46, + "confidence": 0.943 + }, + { + "text": "問", + "start": 5.46, + "end": 5.6, + "confidence": 0.99 + }, + { + "text": "いただ", + "start": 5.6, + "end": 5.92, + "confidence": 0.922 + }, + { + "text": "いて", + "start": 5.92, + "end": 6.16, + "confidence": 0.982 + }, + { + "text": "お", + "start": 6.16, + "end": 6.26, + "confidence": 0.79 + }, + { + "text": "ります", + "start": 6.26, + "end": 6.62, + "confidence": 0.975 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 6.92, + "end": 12.9, + "text": "同じ度面でデレクトリーごとに 別再度として管理上をしている際と針", + "tokens": [ + 50712, + 13089, + 9257, + 13127, + 8833, + 2474, + 31327, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 220, + 16158, + 8623, + 13127, + 3193, + 8822, + 23131, + 13876, + 5708, + 5998, + 8822, + 22979, + 34837, + 3193, + 5873, + 251, + 51010 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.524, + "words": [ + { + "text": "同", + "start": 6.92, + "end": 7.3, + "confidence": 0.83 + }, + { + "text": "じ", + "start": 
7.3, + "end": 7.42, + "confidence": 0.227 + }, + { + "text": "度", + "start": 7.42, + "end": 7.6, + "confidence": 0.138 + }, + { + "text": "面", + "start": 7.6, + "end": 7.76, + "confidence": 0.296 + }, + { + "text": "で", + "start": 7.76, + "end": 8.0, + "confidence": 0.567 + }, + { + "text": "デ", + "start": 8.0, + "end": 8.16, + "confidence": 0.51 + }, + { + "text": "レ", + "start": 8.16, + "end": 8.28, + "confidence": 0.481 + }, + { + "text": "ク", + "start": 8.28, + "end": 8.36, + "confidence": 0.98 + }, + { + "text": "ト", + "start": 8.36, + "end": 8.5, + "confidence": 0.984 + }, + { + "text": "リ", + "start": 8.5, + "end": 8.62, + "confidence": 0.967 + }, + { + "text": "ー", + "start": 8.62, + "end": 8.7, + "confidence": 0.644 + }, + { + "text": "ご", + "start": 8.7, + "end": 8.84, + "confidence": 0.227 + }, + { + "text": "と", + "start": 8.84, + "end": 8.98, + "confidence": 0.988 + }, + { + "text": "に", + "start": 8.98, + "end": 9.14, + "confidence": 0.988 + }, + { + "text": " ", + "start": 9.14, + "end": 9.38, + "confidence": 0.261 + }, + { + "text": "別", + "start": 9.38, + "end": 9.42, + "confidence": 0.405 + }, + { + "text": "再", + "start": 9.42, + "end": 9.58, + "confidence": 0.427 + }, + { + "text": "度", + "start": 9.58, + "end": 9.74, + "confidence": 0.327 + }, + { + "text": "と", + "start": 9.74, + "end": 9.9, + "confidence": 0.886 + }, + { + "text": "して", + "start": 9.9, + "end": 10.3, + "confidence": 0.998 + }, + { + "text": "管", + "start": 10.3, + "end": 10.88, + "confidence": 0.821 + }, + { + "text": "理", + "start": 10.88, + "end": 11.06, + "confidence": 1.0 + }, + { + "text": "上", + "start": 11.06, + "end": 11.38, + "confidence": 0.466 + }, + { + "text": "を", + "start": 11.38, + "end": 11.54, + "confidence": 0.966 + }, + { + "text": "して", + "start": 11.54, + "end": 11.84, + "confidence": 0.916 + }, + { + "text": "いる", + "start": 11.84, + "end": 12.16, + "confidence": 0.979 + }, + { + "text": "際", + "start": 12.16, + "end": 12.54, + "confidence": 0.122 + }, 
+ { + "text": "と", + "start": 12.54, + "end": 12.7, + "confidence": 0.712 + }, + { + "text": "針", + "start": 12.7, + "end": 12.9, + "confidence": 0.264 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 12.9, + "end": 19.55, + "text": "ます サプテレクトリーごとにわけたサイトはそれぞれ パブリシャーセンターに登録していく", + "tokens": [ + 51010, + 5368, + 220, + 23607, + 20953, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 9206, + 7625, + 3368, + 23607, + 8040, + 7588, + 3065, + 13873, + 31563, + 4132, + 15096, + 239, + 28889, + 12376, + 11054, + 17233, + 3384, + 31223, + 4824, + 30736, + 4108, + 46246, + 8822, + 49394, + 51340 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.715, + "words": [ + { + "text": "ます", + "start": 12.9, + "end": 13.22, + "confidence": 0.344 + }, + { + "text": " ", + "start": 13.22, + "end": 14.1, + "confidence": 0.34 + }, + { + "text": "サ", + "start": 14.1, + "end": 14.22, + "confidence": 0.555 + }, + { + "text": "プ", + "start": 14.22, + "end": 14.32, + "confidence": 0.786 + }, + { + "text": "テ", + "start": 14.32, + "end": 14.42, + "confidence": 0.622 + }, + { + "text": "レ", + "start": 14.42, + "end": 14.58, + "confidence": 0.865 + }, + { + "text": "ク", + "start": 14.58, + "end": 14.68, + "confidence": 0.996 + }, + { + "text": "ト", + "start": 14.68, + "end": 14.78, + "confidence": 0.999 + }, + { + "text": "リ", + "start": 14.78, + "end": 14.92, + "confidence": 0.996 + }, + { + "text": "ー", + "start": 14.92, + "end": 15.04, + "confidence": 0.996 + }, + { + "text": "ご", + "start": 15.04, + "end": 15.1, + "confidence": 0.965 + }, + { + "text": "と", + "start": 15.1, + "end": 15.38, + "confidence": 0.998 + }, + { + "text": "に", + "start": 15.38, + "end": 15.84, + "confidence": 0.625 + }, + { + "text": "わ", + "start": 15.84, + "end": 16.02, + "confidence": 0.739 + }, + { + "text": "け", + "start": 16.02, + "end": 16.14, + "confidence": 0.992 + 
}, + { + "text": "た", + "start": 16.14, + "end": 16.28, + "confidence": 0.885 + }, + { + "text": "サ", + "start": 16.28, + "end": 16.42, + "confidence": 0.304 + }, + { + "text": "イ", + "start": 16.42, + "end": 16.5, + "confidence": 0.976 + }, + { + "text": "ト", + "start": 16.5, + "end": 16.6, + "confidence": 0.932 + }, + { + "text": "は", + "start": 16.6, + "end": 17.08, + "confidence": 0.894 + }, + { + "text": "それ", + "start": 17.08, + "end": 17.46, + "confidence": 0.474 + }, + { + "text": "ぞ", + "start": 17.46, + "end": 17.64, + "confidence": 0.919 + }, + { + "text": "れ", + "start": 17.64, + "end": 17.72, + "confidence": 0.998 + }, + { + "text": " パ", + "start": 17.72, + "end": 17.86, + "confidence": 0.506 + }, + { + "text": "ブ", + "start": 17.86, + "end": 17.94, + "confidence": 0.961 + }, + { + "text": "リ", + "start": 17.94, + "end": 18.06, + "confidence": 0.988 + }, + { + "text": "シ", + "start": 18.06, + "end": 18.18, + "confidence": 0.542 + }, + { + "text": "ャ", + "start": 18.18, + "end": 18.26, + "confidence": 0.911 + }, + { + "text": "ー", + "start": 18.26, + "end": 18.42, + "confidence": 0.546 + }, + { + "text": "セ", + "start": 18.42, + "end": 18.44, + "confidence": 0.367 + }, + { + "text": "ン", + "start": 18.44, + "end": 18.48, + "confidence": 0.915 + }, + { + "text": "ター", + "start": 18.48, + "end": 18.6, + "confidence": 0.996 + }, + { + "text": "に", + "start": 18.6, + "end": 18.76, + "confidence": 0.707 + }, + { + "text": "登録", + "start": 18.76, + "end": 19.12, + "confidence": 0.668 + }, + { + "text": "して", + "start": 19.12, + "end": 19.38, + "confidence": 0.438 + }, + { + "text": "いく", + "start": 19.38, + "end": 19.55, + "confidence": 0.806 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 19.55, + "end": 27.08, + "text": "グルニュース上では 別再度として認識され パンコン愛行は最図ごと物物は正しく表示されます", + "tokens": [ + 51340, + 23839, + 9405, + 34737, + 26167, + 3384, + 9550, + 5708, + 16719, + 220, + 16158, + 8623, + 13127, + 3193, + 8822, + 22041, + 43143, + 6722, + 4132, + 220, + 
23268, + 1047, + 111, + 18066, + 4824, + 15157, + 8082, + 3065, + 8661, + 3919, + 111, + 9991, + 3193, + 23516, + 23516, + 3065, + 15789, + 26568, + 40053, + 6722, + 4132, + 5368, + 51727 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.554, + "words": [ + { + "text": "グ", + "start": 19.55, + "end": 19.78, + "confidence": 0.701 + }, + { + "text": "ル", + "start": 19.78, + "end": 19.88, + "confidence": 0.976 + }, + { + "text": "ニ", + "start": 19.88, + "end": 20.02, + "confidence": 0.899 + }, + { + "text": "ュ", + "start": 20.02, + "end": 20.14, + "confidence": 0.996 + }, + { + "text": "ー", + "start": 20.14, + "end": 20.18, + "confidence": 0.994 + }, + { + "text": "ス", + "start": 20.18, + "end": 20.22, + "confidence": 0.958 + }, + { + "text": "上", + "start": 20.22, + "end": 20.42, + "confidence": 0.313 + }, + { + "text": "では", + "start": 20.42, + "end": 20.82, + "confidence": 0.783 + }, + { + "text": " ", + "start": 20.82, + "end": 21.1, + "confidence": 0.595 + }, + { + "text": "別", + "start": 21.1, + "end": 21.16, + "confidence": 0.294 + }, + { + "text": "再", + "start": 21.16, + "end": 21.34, + "confidence": 0.84 + }, + { + "text": "度", + "start": 21.34, + "end": 21.46, + "confidence": 1.0 + }, + { + "text": "と", + "start": 21.46, + "end": 21.64, + "confidence": 0.992 + }, + { + "text": "して", + "start": 21.64, + "end": 21.82, + "confidence": 0.994 + }, + { + "text": "認", + "start": 21.82, + "end": 22.04, + "confidence": 0.497 + }, + { + "text": "識", + "start": 22.04, + "end": 22.2, + "confidence": 0.99 + }, + { + "text": "さ", + "start": 22.2, + "end": 22.34, + "confidence": 0.994 + }, + { + "text": "れ", + "start": 22.34, + "end": 22.7, + "confidence": 0.958 + }, + { + "text": " ", + "start": 22.7, + "end": 22.76, + "confidence": 0.204 + }, + { + "text": "パ", + "start": 22.76, + "end": 22.9, + "confidence": 0.039 + }, + { + "text": "ン", + "start": 22.9, + 
"end": 23.0, + "confidence": 0.332 + }, + { + "text": "コ", + "start": 23.0, + "end": 23.24, + "confidence": 0.918 + }, + { + "text": "ン", + "start": 23.24, + "end": 23.4, + "confidence": 0.807 + }, + { + "text": "愛", + "start": 23.4, + "end": 23.48, + "confidence": 0.239 + }, + { + "text": "行", + "start": 23.48, + "end": 23.64, + "confidence": 0.134 + }, + { + "text": "は", + "start": 23.64, + "end": 23.86, + "confidence": 0.959 + }, + { + "text": "最", + "start": 23.86, + "end": 24.1, + "confidence": 0.729 + }, + { + "text": "図", + "start": 24.1, + "end": 24.3, + "confidence": 0.948 + }, + { + "text": "ご", + "start": 24.3, + "end": 24.42, + "confidence": 0.154 + }, + { + "text": "と", + "start": 24.42, + "end": 24.52, + "confidence": 0.969 + }, + { + "text": "物", + "start": 24.52, + "end": 24.76, + "confidence": 0.238 + }, + { + "text": "物", + "start": 24.76, + "end": 24.92, + "confidence": 0.197 + }, + { + "text": "は", + "start": 24.92, + "end": 25.08, + "confidence": 0.566 + }, + { + "text": "正", + "start": 25.08, + "end": 25.36, + "confidence": 0.454 + }, + { + "text": "しく", + "start": 25.36, + "end": 25.64, + "confidence": 0.955 + }, + { + "text": "表示", + "start": 25.64, + "end": 26.0, + "confidence": 0.414 + }, + { + "text": "さ", + "start": 26.0, + "end": 26.28, + "confidence": 0.712 + }, + { + "text": "れ", + "start": 26.28, + "end": 26.62, + "confidence": 0.976 + }, + { + "text": "ます", + "start": 26.62, + "end": 27.08, + "confidence": 0.474 + } + ] + }, + { + "id": 4, + "seek": 2726, + "start": 27.36, + "end": 32.39, + "text": "しかし グルニュースタブでは バブコン最図免証記ともに正しくない", + "tokens": [ + 50364, + 32156, + 2849, + 220, + 23839, + 9405, + 34737, + 26167, + 3384, + 9550, + 12144, + 28889, + 16719, + 15096, + 238, + 28889, + 18066, + 4824, + 8661, + 3919, + 111, + 2347, + 235, + 5396, + 120, + 16958, + 3193, + 4801, + 4108, + 15789, + 26568, + 9311, + 50620 + ], + "temperature": 0.0, + "avg_logprob": -0.44616998208535685, + "compression_ratio": 1.375, + "no_speech_prob": 
0.3626025915145874, + "confidence": 0.806, + "words": [ + { + "text": "しか", + "start": 27.36, + "end": 27.58, + "confidence": 0.959 + }, + { + "text": "し", + "start": 27.58, + "end": 27.74, + "confidence": 0.992 + }, + { + "text": " ", + "start": 27.74, + "end": 27.84, + "confidence": 0.249 + }, + { + "text": "グ", + "start": 27.84, + "end": 27.92, + "confidence": 0.445 + }, + { + "text": "ル", + "start": 27.92, + "end": 28.04, + "confidence": 0.995 + }, + { + "text": "ニ", + "start": 28.04, + "end": 28.24, + "confidence": 0.884 + }, + { + "text": "ュ", + "start": 28.24, + "end": 28.7, + "confidence": 0.995 + }, + { + "text": "ー", + "start": 28.7, + "end": 29.18, + "confidence": 0.999 + }, + { + "text": "ス", + "start": 29.18, + "end": 29.2, + "confidence": 0.97 + }, + { + "text": "タ", + "start": 29.2, + "end": 29.34, + "confidence": 0.992 + }, + { + "text": "ブ", + "start": 29.34, + "end": 29.44, + "confidence": 0.996 + }, + { + "text": "では", + "start": 29.44, + "end": 29.72, + "confidence": 0.979 + }, + { + "text": " バ", + "start": 29.72, + "end": 30.06, + "confidence": 0.503 + }, + { + "text": "ブ", + "start": 30.06, + "end": 30.16, + "confidence": 0.631 + }, + { + "text": "コ", + "start": 30.16, + "end": 30.34, + "confidence": 0.631 + }, + { + "text": "ン", + "start": 30.34, + "end": 30.42, + "confidence": 0.981 + }, + { + "text": "最", + "start": 30.42, + "end": 30.6, + "confidence": 0.659 + }, + { + "text": "図", + "start": 30.6, + "end": 30.88, + "confidence": 0.957 + }, + { + "text": "免", + "start": 30.88, + "end": 30.94, + "confidence": 0.977 + }, + { + "text": "証", + "start": 30.94, + "end": 31.12, + "confidence": 0.997 + }, + { + "text": "記", + "start": 31.12, + "end": 31.26, + "confidence": 0.994 + }, + { + "text": "と", + "start": 31.26, + "end": 31.42, + "confidence": 0.722 + }, + { + "text": "も", + "start": 31.42, + "end": 31.54, + "confidence": 0.839 + }, + { + "text": "に", + "start": 31.54, + "end": 31.66, + "confidence": 0.945 + }, + { + "text": "正", + 
"start": 31.66, + "end": 31.96, + "confidence": 0.481 + }, + { + "text": "しく", + "start": 31.96, + "end": 32.18, + "confidence": 0.999 + }, + { + "text": "ない", + "start": 32.18, + "end": 32.39, + "confidence": 0.938 + } + ] + }, + { + "id": 5, + "seek": 2726, + "start": 32.39, + "end": 36.34, + "text": "以上 時にいいなります こちらいたしても ではありません", + "tokens": [ + 50620, + 29497, + 220, + 6611, + 4108, + 13806, + 3203, + 19420, + 14384, + 28567, + 17679, + 8822, + 4801, + 220, + 16719, + 14498, + 30250, + 50838 + ], + "temperature": 0.0, + "avg_logprob": -0.44616998208535685, + "compression_ratio": 1.375, + "no_speech_prob": 0.3626025915145874, + "confidence": 0.456, + "words": [ + { + "text": "以上", + "start": 32.39, + "end": 32.74, + "confidence": 0.31 + }, + { + "text": " ", + "start": 32.74, + "end": 33.04, + "confidence": 0.128 + }, + { + "text": "時", + "start": 33.04, + "end": 33.1, + "confidence": 0.355 + }, + { + "text": "に", + "start": 33.1, + "end": 33.12, + "confidence": 0.791 + }, + { + "text": "いい", + "start": 33.12, + "end": 33.36, + "confidence": 0.621 + }, + { + "text": "な", + "start": 33.36, + "end": 33.48, + "confidence": 0.793 + }, + { + "text": "ります", + "start": 33.48, + "end": 34.02, + "confidence": 0.896 + }, + { + "text": " こ", + "start": 34.02, + "end": 34.38, + "confidence": 0.328 + }, + { + "text": "ちら", + "start": 34.38, + "end": 34.56, + "confidence": 0.684 + }, + { + "text": "いた", + "start": 34.56, + "end": 34.84, + "confidence": 0.571 + }, + { + "text": "して", + "start": 34.84, + "end": 35.04, + "confidence": 0.437 + }, + { + "text": "も", + "start": 35.04, + "end": 35.18, + "confidence": 0.422 + }, + { + "text": " ", + "start": 35.18, + "end": 35.38, + "confidence": 0.244 + }, + { + "text": "では", + "start": 35.38, + "end": 35.46, + "confidence": 0.139 + }, + { + "text": "あり", + "start": 35.46, + "end": 35.72, + "confidence": 0.903 + }, + { + "text": "ません", + "start": 35.72, + "end": 36.34, + "confidence": 0.997 + } + ] + }, + { + "id": 6, + "seek": 
2726, + "start": 36.42, + "end": 40.4, + "text": "パブコンはサプテレクトリーごとに 設定した", + "tokens": [ + 50838, + 23268, + 28889, + 18066, + 4824, + 3065, + 23607, + 20953, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 220, + 39035, + 12088, + 8533, + 51042 + ], + "temperature": 0.0, + "avg_logprob": -0.44616998208535685, + "compression_ratio": 1.375, + "no_speech_prob": 0.3626025915145874, + "confidence": 0.849, + "words": [ + { + "text": "パ", + "start": 36.42, + "end": 36.92, + "confidence": 0.482 + }, + { + "text": "ブ", + "start": 36.92, + "end": 37.04, + "confidence": 0.648 + }, + { + "text": "コ", + "start": 37.04, + "end": 37.2, + "confidence": 0.689 + }, + { + "text": "ン", + "start": 37.2, + "end": 37.72, + "confidence": 0.994 + }, + { + "text": "は", + "start": 37.72, + "end": 37.74, + "confidence": 0.975 + }, + { + "text": "サ", + "start": 37.74, + "end": 38.22, + "confidence": 0.668 + }, + { + "text": "プ", + "start": 38.22, + "end": 38.32, + "confidence": 0.572 + }, + { + "text": "テ", + "start": 38.32, + "end": 38.42, + "confidence": 0.984 + }, + { + "text": "レ", + "start": 38.42, + "end": 38.56, + "confidence": 0.997 + }, + { + "text": "ク", + "start": 38.56, + "end": 38.68, + "confidence": 0.997 + }, + { + "text": "ト", + "start": 38.68, + "end": 38.78, + "confidence": 0.998 + }, + { + "text": "リ", + "start": 38.78, + "end": 38.92, + "confidence": 0.999 + }, + { + "text": "ー", + "start": 38.92, + "end": 38.96, + "confidence": 0.987 + }, + { + "text": "ご", + "start": 38.96, + "end": 39.08, + "confidence": 0.959 + }, + { + "text": "と", + "start": 39.08, + "end": 39.26, + "confidence": 0.999 + }, + { + "text": "に", + "start": 39.26, + "end": 39.58, + "confidence": 0.974 + }, + { + "text": " ", + "start": 39.58, + "end": 39.66, + "confidence": 0.663 + }, + { + "text": "設", + "start": 39.66, + "end": 39.82, + "confidence": 0.911 + }, + { + "text": "定", + "start": 39.82, + "end": 40.02, + "confidence": 0.999 + }, + { + "text": "した", + "start": 
40.02, + "end": 40.4, + "confidence": 0.873 + } + ] + } + ], + "language": "ja", + "language_probs": { + "en": 0.006242657545953989, + "zh": 0.0014827612321823835, + "de": 0.00011256561992922798, + "es": 0.0013291386421769857, + "ru": 0.00022561925288755447, + "ko": 0.00042481819400563836, + "fr": 0.0003206696128472686, + "ja": 0.9862462282180786, + "pt": 0.0003521866456139833, + "tr": 8.698396413819864e-05, + "pl": 0.0008716703741811216, + "ca": 1.310503307649924e-06, + "nl": 1.0388754162704572e-05, + "ar": 1.634380350878928e-05, + "sv": 1.8519956938689575e-05, + "it": 0.0001502948289271444, + "id": 1.4650489902123809e-05, + "hi": 3.542034392012283e-05, + "fi": 3.327432932564989e-05, + "vi": 9.459067769057583e-06, + "he": 1.488120233261725e-05, + "uk": 2.396660238446202e-05, + "el": 3.683132672449574e-05, + "ms": 3.514470154186711e-05, + "cs": 1.2629512639250606e-05, + "ro": 2.034019234997686e-05, + "da": 7.294049737538444e-07, + "hu": 8.41306882648496e-06, + "ta": 3.047011659873533e-06, + "no": 4.935400852446037e-07, + "th": 2.396660238446202e-05, + "ur": 1.823282946133986e-05, + "hr": 3.2435270895803114e-06, + "bg": 5.906901492380712e-07, + "lt": 1.666117981358184e-07, + "la": 0.00018271202861797065, + "mi": 8.044702553888783e-05, + "ml": 1.6182557374122553e-06, + "cy": 6.168086838442832e-05, + "sk": 7.948603979457403e-07, + "te": 2.2118931610748405e-06, + "fa": 1.647198951104656e-05, + "lv": 2.2245595232561755e-07, + "bn": 1.0470233064552303e-05, + "sr": 5.132005185259914e-07, + "az": 6.641308232246956e-07, + "sl": 1.0286258884661947e-06, + "kn": 4.97411008382187e-07, + "et": 6.641308232246956e-07, + "mk": 2.2420069001327647e-07, + "br": 3.301538890809752e-05, + "eu": 3.920674862456508e-05, + "is": 1.7324887835457048e-07, + "hy": 1.6566315252930508e-06, + "ne": 9.148787967205863e-07, + "mn": 2.098585719068069e-05, + "bs": 1.1565151680770214e-06, + "kk": 2.4623628291919886e-07, + "sq": 8.798302815193892e-07, + "sw": 8.885971510608215e-06, + "gl": 
4.239260306349024e-05, + "mr": 5.725165124204068e-07, + "pa": 1.6309478496623342e-06, + "si": 1.4423355423787143e-05, + "km": 4.045130481244996e-05, + "sn": 2.304845656908583e-05, + "yo": 3.3991873351624236e-06, + "so": 2.3866036258368695e-07, + "af": 9.969784287022776e-07, + "oc": 5.474488716572523e-06, + "ka": 1.0864454225156805e-06, + "be": 5.692566901416285e-06, + "tg": 1.913662650565584e-08, + "sd": 1.6959174899966456e-06, + "gu": 3.2115266890286875e-07, + "am": 1.2975741014997766e-07, + "yi": 4.197435828245943e-06, + "lo": 2.600773427730019e-07, + "uz": 3.430495609801909e-10, + "fo": 1.4281055200626724e-06, + "ht": 2.373014922341099e-06, + "ps": 1.5321337514251354e-06, + "tk": 7.745855623575437e-10, + "nn": 0.0009135027066804469, + "mt": 1.0673553418882875e-07, + "sa": 1.7262496839975938e-05, + "lb": 3.051601860093456e-09, + "my": 2.098585719068069e-05, + "bo": 1.303041608480271e-05, + "tl": 7.029382231849013e-06, + "mg": 1.3073606641711422e-09, + "as": 4.321581172916922e-07, + "tt": 3.4714515706468774e-09, + "haw": 2.8909242246299982e-05, + "ln": 8.594491305302654e-07, + "ha": 6.384976991569147e-09, + "ba": 5.375886957814657e-10, + "jw": 0.00019148056162521243, + "su": 3.087572864046706e-09 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/jp_japanese.mp3.words.json b/tests/expected/tiny_auto/jp_japanese.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..11667c628b7040a6f550c2ae1dfa9837a6a5be74 --- /dev/null +++ b/tests/expected/tiny_auto/jp_japanese.mp3.words.json @@ -0,0 +1,1518 @@ +{ + "text": "いきます 入室タブでの最図免証記が実際と違う県に関するご質問いただいております同じ度面でデレクトリーごとに 別再度として管理上をしている際と針ます サプテレクトリーごとにわけたサイトはそれぞれ パブリシャーセンターに登録していくグルニュース上では 別再度として認識され パンコン愛行は最図ごと物物は正しく表示されますしかし グルニュースタブでは バブコン最図免証記ともに正しくない以上 時にいいなります こちらいたしても ではありませんパブコンはサプテレクトリーごとに 設定した", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.08, + "end": 6.62, + "text": "いきます 入室タブでの最図免証記が実際と違う県に関するご質問いただいております", + "tokens": [ + 50364, + 47348, + 220, + 
14028, + 2415, + 97, + 12144, + 28889, + 2474, + 2972, + 8661, + 3919, + 111, + 2347, + 235, + 5396, + 120, + 16958, + 5142, + 33197, + 34837, + 3193, + 49806, + 2862, + 234, + 4108, + 5196, + 95, + 22570, + 9991, + 43450, + 11361, + 32418, + 18549, + 6117, + 19420, + 50712 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.551, + "words": [ + { + "text": "いきます", + "start": 0.08, + "end": 0.6, + "confidence": 0.153 + }, + { + "text": " ", + "start": 0.6, + "end": 1.18, + "confidence": 0.305 + }, + { + "text": "入", + "start": 1.18, + "end": 1.38, + "confidence": 0.435 + }, + { + "text": "室", + "start": 1.38, + "end": 1.52, + "confidence": 0.501 + }, + { + "text": "タ", + "start": 1.52, + "end": 1.68, + "confidence": 0.201 + }, + { + "text": "ブ", + "start": 1.68, + "end": 1.78, + "confidence": 0.837 + }, + { + "text": "で", + "start": 1.78, + "end": 1.98, + "confidence": 0.947 + }, + { + "text": "の", + "start": 1.98, + "end": 2.22, + "confidence": 0.907 + }, + { + "text": "最", + "start": 2.22, + "end": 2.64, + "confidence": 0.277 + }, + { + "text": "図", + "start": 2.64, + "end": 2.78, + "confidence": 0.349 + }, + { + "text": "免", + "start": 2.78, + "end": 2.98, + "confidence": 0.647 + }, + { + "text": "証", + "start": 2.98, + "end": 3.18, + "confidence": 0.282 + }, + { + "text": "記", + "start": 3.18, + "end": 3.32, + "confidence": 0.299 + }, + { + "text": "が", + "start": 3.32, + "end": 3.5, + "confidence": 0.976 + }, + { + "text": "実", + "start": 3.5, + "end": 3.74, + "confidence": 0.343 + }, + { + "text": "際", + "start": 3.74, + "end": 3.9, + "confidence": 0.975 + }, + { + "text": "と", + "start": 3.9, + "end": 4.08, + "confidence": 0.91 + }, + { + "text": "違う", + "start": 4.08, + "end": 4.38, + "confidence": 0.803 + }, + { + "text": "県", + "start": 4.38, + "end": 4.6, + "confidence": 0.405 + }, + { + "text": "に", + "start": 4.6, + "end": 4.74, + 
"confidence": 0.988 + }, + { + "text": "関", + "start": 4.74, + "end": 4.94, + "confidence": 0.543 + }, + { + "text": "する", + "start": 4.94, + "end": 5.12, + "confidence": 0.947 + }, + { + "text": "ご", + "start": 5.12, + "end": 5.3, + "confidence": 0.499 + }, + { + "text": "質", + "start": 5.3, + "end": 5.46, + "confidence": 0.943 + }, + { + "text": "問", + "start": 5.46, + "end": 5.6, + "confidence": 0.99 + }, + { + "text": "いただ", + "start": 5.6, + "end": 5.92, + "confidence": 0.922 + }, + { + "text": "いて", + "start": 5.92, + "end": 6.16, + "confidence": 0.982 + }, + { + "text": "お", + "start": 6.16, + "end": 6.26, + "confidence": 0.79 + }, + { + "text": "ります", + "start": 6.26, + "end": 6.62, + "confidence": 0.975 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 6.92, + "end": 12.9, + "text": "同じ度面でデレクトリーごとに 別再度として管理上をしている際と針", + "tokens": [ + 50712, + 13089, + 9257, + 13127, + 8833, + 2474, + 31327, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 220, + 16158, + 8623, + 13127, + 3193, + 8822, + 23131, + 13876, + 5708, + 5998, + 8822, + 22979, + 34837, + 3193, + 5873, + 251, + 51010 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.524, + "words": [ + { + "text": "同", + "start": 6.92, + "end": 7.3, + "confidence": 0.83 + }, + { + "text": "じ", + "start": 7.3, + "end": 7.42, + "confidence": 0.227 + }, + { + "text": "度", + "start": 7.42, + "end": 7.6, + "confidence": 0.138 + }, + { + "text": "面", + "start": 7.6, + "end": 7.76, + "confidence": 0.296 + }, + { + "text": "で", + "start": 7.76, + "end": 8.0, + "confidence": 0.567 + }, + { + "text": "デ", + "start": 8.0, + "end": 8.16, + "confidence": 0.51 + }, + { + "text": "レ", + "start": 8.16, + "end": 8.28, + "confidence": 0.481 + }, + { + "text": "ク", + "start": 8.28, + "end": 8.36, + "confidence": 0.98 + }, + { + "text": "ト", + "start": 8.36, + "end": 8.5, + "confidence": 0.984 + }, + { 
+ "text": "リ", + "start": 8.5, + "end": 8.62, + "confidence": 0.967 + }, + { + "text": "ー", + "start": 8.62, + "end": 8.7, + "confidence": 0.644 + }, + { + "text": "ご", + "start": 8.7, + "end": 8.84, + "confidence": 0.227 + }, + { + "text": "と", + "start": 8.84, + "end": 8.98, + "confidence": 0.988 + }, + { + "text": "に", + "start": 8.98, + "end": 9.14, + "confidence": 0.988 + }, + { + "text": " ", + "start": 9.14, + "end": 9.38, + "confidence": 0.261 + }, + { + "text": "別", + "start": 9.38, + "end": 9.42, + "confidence": 0.405 + }, + { + "text": "再", + "start": 9.42, + "end": 9.58, + "confidence": 0.427 + }, + { + "text": "度", + "start": 9.58, + "end": 9.74, + "confidence": 0.327 + }, + { + "text": "と", + "start": 9.74, + "end": 9.9, + "confidence": 0.886 + }, + { + "text": "して", + "start": 9.9, + "end": 10.3, + "confidence": 0.998 + }, + { + "text": "管", + "start": 10.3, + "end": 10.88, + "confidence": 0.821 + }, + { + "text": "理", + "start": 10.88, + "end": 11.06, + "confidence": 1.0 + }, + { + "text": "上", + "start": 11.06, + "end": 11.38, + "confidence": 0.466 + }, + { + "text": "を", + "start": 11.38, + "end": 11.54, + "confidence": 0.966 + }, + { + "text": "して", + "start": 11.54, + "end": 11.84, + "confidence": 0.916 + }, + { + "text": "いる", + "start": 11.84, + "end": 12.16, + "confidence": 0.979 + }, + { + "text": "際", + "start": 12.16, + "end": 12.54, + "confidence": 0.122 + }, + { + "text": "と", + "start": 12.54, + "end": 12.7, + "confidence": 0.712 + }, + { + "text": "針", + "start": 12.7, + "end": 12.9, + "confidence": 0.264 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 12.9, + "end": 19.55, + "text": "ます サプテレクトリーごとにわけたサイトはそれぞれ パブリシャーセンターに登録していく", + "tokens": [ + 51010, + 5368, + 220, + 23607, + 20953, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 9206, + 7625, + 3368, + 23607, + 8040, + 7588, + 3065, + 13873, + 31563, + 4132, + 15096, + 239, + 28889, + 12376, + 11054, + 17233, + 3384, + 31223, + 4824, + 30736, + 
4108, + 46246, + 8822, + 49394, + 51340 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.715, + "words": [ + { + "text": "ます", + "start": 12.9, + "end": 13.22, + "confidence": 0.344 + }, + { + "text": " ", + "start": 13.22, + "end": 14.1, + "confidence": 0.34 + }, + { + "text": "サ", + "start": 14.1, + "end": 14.22, + "confidence": 0.555 + }, + { + "text": "プ", + "start": 14.22, + "end": 14.32, + "confidence": 0.786 + }, + { + "text": "テ", + "start": 14.32, + "end": 14.42, + "confidence": 0.622 + }, + { + "text": "レ", + "start": 14.42, + "end": 14.58, + "confidence": 0.865 + }, + { + "text": "ク", + "start": 14.58, + "end": 14.68, + "confidence": 0.996 + }, + { + "text": "ト", + "start": 14.68, + "end": 14.78, + "confidence": 0.999 + }, + { + "text": "リ", + "start": 14.78, + "end": 14.92, + "confidence": 0.996 + }, + { + "text": "ー", + "start": 14.92, + "end": 15.04, + "confidence": 0.996 + }, + { + "text": "ご", + "start": 15.04, + "end": 15.1, + "confidence": 0.965 + }, + { + "text": "と", + "start": 15.1, + "end": 15.38, + "confidence": 0.998 + }, + { + "text": "に", + "start": 15.38, + "end": 15.84, + "confidence": 0.625 + }, + { + "text": "わ", + "start": 15.84, + "end": 16.02, + "confidence": 0.739 + }, + { + "text": "け", + "start": 16.02, + "end": 16.14, + "confidence": 0.992 + }, + { + "text": "た", + "start": 16.14, + "end": 16.28, + "confidence": 0.885 + }, + { + "text": "サ", + "start": 16.28, + "end": 16.42, + "confidence": 0.304 + }, + { + "text": "イ", + "start": 16.42, + "end": 16.5, + "confidence": 0.976 + }, + { + "text": "ト", + "start": 16.5, + "end": 16.6, + "confidence": 0.932 + }, + { + "text": "は", + "start": 16.6, + "end": 17.08, + "confidence": 0.894 + }, + { + "text": "それ", + "start": 17.08, + "end": 17.46, + "confidence": 0.474 + }, + { + "text": "ぞ", + "start": 17.46, + "end": 17.64, + "confidence": 0.919 + }, + { + "text": "れ", + 
"start": 17.64, + "end": 17.72, + "confidence": 0.998 + }, + { + "text": " パ", + "start": 17.72, + "end": 17.86, + "confidence": 0.506 + }, + { + "text": "ブ", + "start": 17.86, + "end": 17.94, + "confidence": 0.961 + }, + { + "text": "リ", + "start": 17.94, + "end": 18.06, + "confidence": 0.988 + }, + { + "text": "シ", + "start": 18.06, + "end": 18.18, + "confidence": 0.542 + }, + { + "text": "ャ", + "start": 18.18, + "end": 18.26, + "confidence": 0.911 + }, + { + "text": "ー", + "start": 18.26, + "end": 18.42, + "confidence": 0.546 + }, + { + "text": "セ", + "start": 18.42, + "end": 18.44, + "confidence": 0.367 + }, + { + "text": "ン", + "start": 18.44, + "end": 18.48, + "confidence": 0.915 + }, + { + "text": "ター", + "start": 18.48, + "end": 18.6, + "confidence": 0.996 + }, + { + "text": "に", + "start": 18.6, + "end": 18.76, + "confidence": 0.707 + }, + { + "text": "登録", + "start": 18.76, + "end": 19.12, + "confidence": 0.668 + }, + { + "text": "して", + "start": 19.12, + "end": 19.38, + "confidence": 0.438 + }, + { + "text": "いく", + "start": 19.38, + "end": 19.55, + "confidence": 0.806 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 19.55, + "end": 27.08, + "text": "グルニュース上では 別再度として認識され パンコン愛行は最図ごと物物は正しく表示されます", + "tokens": [ + 51340, + 23839, + 9405, + 34737, + 26167, + 3384, + 9550, + 5708, + 16719, + 220, + 16158, + 8623, + 13127, + 3193, + 8822, + 22041, + 43143, + 6722, + 4132, + 220, + 23268, + 1047, + 111, + 18066, + 4824, + 15157, + 8082, + 3065, + 8661, + 3919, + 111, + 9991, + 3193, + 23516, + 23516, + 3065, + 15789, + 26568, + 40053, + 6722, + 4132, + 5368, + 51727 + ], + "temperature": 0.0, + "avg_logprob": -0.5681739258610345, + "compression_ratio": 1.582191780821918, + "no_speech_prob": 0.189762145280838, + "confidence": 0.554, + "words": [ + { + "text": "グ", + "start": 19.55, + "end": 19.78, + "confidence": 0.701 + }, + { + "text": "ル", + "start": 19.78, + "end": 19.88, + "confidence": 0.976 + }, + { + "text": "ニ", + "start": 19.88, + "end": 20.02, + 
"confidence": 0.899 + }, + { + "text": "ュ", + "start": 20.02, + "end": 20.14, + "confidence": 0.996 + }, + { + "text": "ー", + "start": 20.14, + "end": 20.18, + "confidence": 0.994 + }, + { + "text": "ス", + "start": 20.18, + "end": 20.22, + "confidence": 0.958 + }, + { + "text": "上", + "start": 20.22, + "end": 20.42, + "confidence": 0.313 + }, + { + "text": "では", + "start": 20.42, + "end": 20.82, + "confidence": 0.783 + }, + { + "text": " ", + "start": 20.82, + "end": 21.1, + "confidence": 0.595 + }, + { + "text": "別", + "start": 21.1, + "end": 21.16, + "confidence": 0.294 + }, + { + "text": "再", + "start": 21.16, + "end": 21.34, + "confidence": 0.84 + }, + { + "text": "度", + "start": 21.34, + "end": 21.46, + "confidence": 1.0 + }, + { + "text": "と", + "start": 21.46, + "end": 21.64, + "confidence": 0.992 + }, + { + "text": "して", + "start": 21.64, + "end": 21.82, + "confidence": 0.994 + }, + { + "text": "認", + "start": 21.82, + "end": 22.04, + "confidence": 0.497 + }, + { + "text": "識", + "start": 22.04, + "end": 22.2, + "confidence": 0.99 + }, + { + "text": "さ", + "start": 22.2, + "end": 22.34, + "confidence": 0.994 + }, + { + "text": "れ", + "start": 22.34, + "end": 22.7, + "confidence": 0.958 + }, + { + "text": " ", + "start": 22.7, + "end": 22.76, + "confidence": 0.204 + }, + { + "text": "パ", + "start": 22.76, + "end": 22.9, + "confidence": 0.039 + }, + { + "text": "ン", + "start": 22.9, + "end": 23.0, + "confidence": 0.332 + }, + { + "text": "コ", + "start": 23.0, + "end": 23.24, + "confidence": 0.918 + }, + { + "text": "ン", + "start": 23.24, + "end": 23.4, + "confidence": 0.807 + }, + { + "text": "愛", + "start": 23.4, + "end": 23.48, + "confidence": 0.239 + }, + { + "text": "行", + "start": 23.48, + "end": 23.64, + "confidence": 0.134 + }, + { + "text": "は", + "start": 23.64, + "end": 23.86, + "confidence": 0.959 + }, + { + "text": "最", + "start": 23.86, + "end": 24.1, + "confidence": 0.729 + }, + { + "text": "図", + "start": 24.1, + "end": 24.3, + "confidence": 
0.948 + }, + { + "text": "ご", + "start": 24.3, + "end": 24.42, + "confidence": 0.154 + }, + { + "text": "と", + "start": 24.42, + "end": 24.52, + "confidence": 0.969 + }, + { + "text": "物", + "start": 24.52, + "end": 24.76, + "confidence": 0.238 + }, + { + "text": "物", + "start": 24.76, + "end": 24.92, + "confidence": 0.197 + }, + { + "text": "は", + "start": 24.92, + "end": 25.08, + "confidence": 0.566 + }, + { + "text": "正", + "start": 25.08, + "end": 25.36, + "confidence": 0.454 + }, + { + "text": "しく", + "start": 25.36, + "end": 25.64, + "confidence": 0.955 + }, + { + "text": "表示", + "start": 25.64, + "end": 26.0, + "confidence": 0.414 + }, + { + "text": "さ", + "start": 26.0, + "end": 26.28, + "confidence": 0.712 + }, + { + "text": "れ", + "start": 26.28, + "end": 26.62, + "confidence": 0.976 + }, + { + "text": "ます", + "start": 26.62, + "end": 27.08, + "confidence": 0.474 + } + ] + }, + { + "id": 4, + "seek": 2726, + "start": 27.36, + "end": 32.39, + "text": "しかし グルニュースタブでは バブコン最図免証記ともに正しくない", + "tokens": [ + 50364, + 32156, + 2849, + 220, + 23839, + 9405, + 34737, + 26167, + 3384, + 9550, + 12144, + 28889, + 16719, + 15096, + 238, + 28889, + 18066, + 4824, + 8661, + 3919, + 111, + 2347, + 235, + 5396, + 120, + 16958, + 3193, + 4801, + 4108, + 15789, + 26568, + 9311, + 50620 + ], + "temperature": 0.0, + "avg_logprob": -0.44616998208535685, + "compression_ratio": 1.375, + "no_speech_prob": 0.3626025915145874, + "confidence": 0.806, + "words": [ + { + "text": "しか", + "start": 27.36, + "end": 27.58, + "confidence": 0.959 + }, + { + "text": "し", + "start": 27.58, + "end": 27.74, + "confidence": 0.992 + }, + { + "text": " ", + "start": 27.74, + "end": 27.84, + "confidence": 0.249 + }, + { + "text": "グ", + "start": 27.84, + "end": 27.92, + "confidence": 0.445 + }, + { + "text": "ル", + "start": 27.92, + "end": 28.04, + "confidence": 0.995 + }, + { + "text": "ニ", + "start": 28.04, + "end": 28.24, + "confidence": 0.884 + }, + { + "text": "ュ", + "start": 28.24, + "end": 
28.7, + "confidence": 0.995 + }, + { + "text": "ー", + "start": 28.7, + "end": 29.18, + "confidence": 0.999 + }, + { + "text": "ス", + "start": 29.18, + "end": 29.2, + "confidence": 0.97 + }, + { + "text": "タ", + "start": 29.2, + "end": 29.34, + "confidence": 0.992 + }, + { + "text": "ブ", + "start": 29.34, + "end": 29.44, + "confidence": 0.996 + }, + { + "text": "では", + "start": 29.44, + "end": 29.72, + "confidence": 0.979 + }, + { + "text": " バ", + "start": 29.72, + "end": 30.06, + "confidence": 0.503 + }, + { + "text": "ブ", + "start": 30.06, + "end": 30.16, + "confidence": 0.631 + }, + { + "text": "コ", + "start": 30.16, + "end": 30.34, + "confidence": 0.631 + }, + { + "text": "ン", + "start": 30.34, + "end": 30.42, + "confidence": 0.981 + }, + { + "text": "最", + "start": 30.42, + "end": 30.6, + "confidence": 0.659 + }, + { + "text": "図", + "start": 30.6, + "end": 30.88, + "confidence": 0.957 + }, + { + "text": "免", + "start": 30.88, + "end": 30.94, + "confidence": 0.977 + }, + { + "text": "証", + "start": 30.94, + "end": 31.12, + "confidence": 0.997 + }, + { + "text": "記", + "start": 31.12, + "end": 31.26, + "confidence": 0.994 + }, + { + "text": "と", + "start": 31.26, + "end": 31.42, + "confidence": 0.722 + }, + { + "text": "も", + "start": 31.42, + "end": 31.54, + "confidence": 0.839 + }, + { + "text": "に", + "start": 31.54, + "end": 31.66, + "confidence": 0.945 + }, + { + "text": "正", + "start": 31.66, + "end": 31.96, + "confidence": 0.481 + }, + { + "text": "しく", + "start": 31.96, + "end": 32.18, + "confidence": 0.999 + }, + { + "text": "ない", + "start": 32.18, + "end": 32.39, + "confidence": 0.938 + } + ] + }, + { + "id": 5, + "seek": 2726, + "start": 32.39, + "end": 36.34, + "text": "以上 時にいいなります こちらいたしても ではありません", + "tokens": [ + 50620, + 29497, + 220, + 6611, + 4108, + 13806, + 3203, + 19420, + 14384, + 28567, + 17679, + 8822, + 4801, + 220, + 16719, + 14498, + 30250, + 50838 + ], + "temperature": 0.0, + "avg_logprob": -0.44616998208535685, + 
"compression_ratio": 1.375, + "no_speech_prob": 0.3626025915145874, + "confidence": 0.456, + "words": [ + { + "text": "以上", + "start": 32.39, + "end": 32.74, + "confidence": 0.31 + }, + { + "text": " ", + "start": 32.74, + "end": 33.04, + "confidence": 0.128 + }, + { + "text": "時", + "start": 33.04, + "end": 33.1, + "confidence": 0.355 + }, + { + "text": "に", + "start": 33.1, + "end": 33.12, + "confidence": 0.791 + }, + { + "text": "いい", + "start": 33.12, + "end": 33.36, + "confidence": 0.621 + }, + { + "text": "な", + "start": 33.36, + "end": 33.48, + "confidence": 0.793 + }, + { + "text": "ります", + "start": 33.48, + "end": 34.02, + "confidence": 0.896 + }, + { + "text": " こ", + "start": 34.02, + "end": 34.38, + "confidence": 0.328 + }, + { + "text": "ちら", + "start": 34.38, + "end": 34.56, + "confidence": 0.684 + }, + { + "text": "いた", + "start": 34.56, + "end": 34.84, + "confidence": 0.571 + }, + { + "text": "して", + "start": 34.84, + "end": 35.04, + "confidence": 0.437 + }, + { + "text": "も", + "start": 35.04, + "end": 35.18, + "confidence": 0.422 + }, + { + "text": " ", + "start": 35.18, + "end": 35.38, + "confidence": 0.244 + }, + { + "text": "では", + "start": 35.38, + "end": 35.46, + "confidence": 0.139 + }, + { + "text": "あり", + "start": 35.46, + "end": 35.72, + "confidence": 0.903 + }, + { + "text": "ません", + "start": 35.72, + "end": 36.34, + "confidence": 0.997 + } + ] + }, + { + "id": 6, + "seek": 2726, + "start": 36.42, + "end": 40.4, + "text": "パブコンはサプテレクトリーごとに 設定した", + "tokens": [ + 50838, + 23268, + 28889, + 18066, + 4824, + 3065, + 23607, + 20953, + 22985, + 16680, + 10825, + 7588, + 12376, + 3384, + 9991, + 3193, + 4108, + 220, + 39035, + 12088, + 8533, + 51042 + ], + "temperature": 0.0, + "avg_logprob": -0.44616998208535685, + "compression_ratio": 1.375, + "no_speech_prob": 0.3626025915145874, + "confidence": 0.849, + "words": [ + { + "text": "パ", + "start": 36.42, + "end": 36.92, + "confidence": 0.482 + }, + { + "text": "ブ", + "start": 36.92, + "end": 
37.04, + "confidence": 0.648 + }, + { + "text": "コ", + "start": 37.04, + "end": 37.2, + "confidence": 0.689 + }, + { + "text": "ン", + "start": 37.2, + "end": 37.72, + "confidence": 0.994 + }, + { + "text": "は", + "start": 37.72, + "end": 37.74, + "confidence": 0.975 + }, + { + "text": "サ", + "start": 37.74, + "end": 38.22, + "confidence": 0.668 + }, + { + "text": "プ", + "start": 38.22, + "end": 38.32, + "confidence": 0.572 + }, + { + "text": "テ", + "start": 38.32, + "end": 38.42, + "confidence": 0.984 + }, + { + "text": "レ", + "start": 38.42, + "end": 38.56, + "confidence": 0.997 + }, + { + "text": "ク", + "start": 38.56, + "end": 38.68, + "confidence": 0.997 + }, + { + "text": "ト", + "start": 38.68, + "end": 38.78, + "confidence": 0.998 + }, + { + "text": "リ", + "start": 38.78, + "end": 38.92, + "confidence": 0.999 + }, + { + "text": "ー", + "start": 38.92, + "end": 38.96, + "confidence": 0.987 + }, + { + "text": "ご", + "start": 38.96, + "end": 39.08, + "confidence": 0.959 + }, + { + "text": "と", + "start": 39.08, + "end": 39.26, + "confidence": 0.999 + }, + { + "text": "に", + "start": 39.26, + "end": 39.58, + "confidence": 0.974 + }, + { + "text": " ", + "start": 39.58, + "end": 39.66, + "confidence": 0.663 + }, + { + "text": "設", + "start": 39.66, + "end": 39.82, + "confidence": 0.911 + }, + { + "text": "定", + "start": 39.82, + "end": 40.02, + "confidence": 0.999 + }, + { + "text": "した", + "start": 40.02, + "end": 40.4, + "confidence": 0.873 + } + ] + } + ], + "language": "Japanese" +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/laugh1.mp3.words.json b/tests/expected/tiny_auto/laugh1.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..cc02e90afb5f0b83143a69184da958427ed4a000 --- /dev/null +++ b/tests/expected/tiny_auto/laugh1.mp3.words.json @@ -0,0 +1,171 @@ +{ + "text": " You can't do it, you can't.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.0, + "end": 1.7, + "text": " You can't do it, you 
can't.", + "tokens": [ + 50364, + 509, + 393, + 380, + 360, + 309, + 11, + 291, + 393, + 380, + 13, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -1.3003114553598256, + "compression_ratio": 0.9310344827586207, + "no_speech_prob": 0.4180056154727936, + "confidence": 0.277, + "words": [ + { + "text": "You", + "start": 0.0, + "end": 0.56, + "confidence": 0.081 + }, + { + "text": "can't", + "start": 0.56, + "end": 0.82, + "confidence": 0.302 + }, + { + "text": "do", + "start": 0.82, + "end": 1.04, + "confidence": 0.118 + }, + { + "text": "it,", + "start": 1.04, + "end": 1.2, + "confidence": 0.374 + }, + { + "text": "you", + "start": 1.26, + "end": 1.5, + "confidence": 0.141 + }, + { + "text": "can't.", + "start": 1.5, + "end": 1.7, + "confidence": 0.868 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.2290046215057373, + "zh": 0.008879472501575947, + "de": 0.02778141386806965, + "es": 0.03680439293384552, + "ru": 0.018077710643410683, + "ko": 0.06068018823862076, + "fr": 0.05030563846230507, + "ja": 0.027565214782953262, + "pt": 0.053550075739622116, + "tr": 0.052719857543706894, + "pl": 0.02609822154045105, + "ca": 0.0011647333158180118, + "nl": 0.012231990694999695, + "ar": 0.04652511328458786, + "sv": 0.05790143832564354, + "it": 0.018219497054815292, + "id": 0.006198871415108442, + "hi": 0.02866329252719879, + "fi": 0.007714619394391775, + "vi": 0.0017484717536717653, + "he": 0.006247490178793669, + "uk": 0.00416172482073307, + "el": 0.023394295945763588, + "ms": 0.0023163489531725645, + "cs": 0.0035045240074396133, + "ro": 0.003819013712927699, + "da": 0.004903710447251797, + "hu": 0.019854480400681496, + "ta": 0.004097203724086285, + "no": 0.005219973158091307, + "th": 0.006808128207921982, + "ur": 0.03651798143982887, + "hr": 0.000954348302911967, + "bg": 0.0005249864771030843, + "lt": 0.0007880979683250189, + "la": 0.005219973158091307, + "mi": 0.002624767366796732, + "ml": 0.002624767366796732, + "cy": 0.01487031951546669, + "sk": 
0.00025685937725938857, + "te": 0.0010814183624461293, + "fa": 0.006496361456811428, + "lv": 0.00022229323803912848, + "bn": 0.0018612387357279658, + "sr": 0.0006533561972901225, + "az": 0.0015190986450761557, + "sl": 0.0012302036629989743, + "kn": 0.00015218414773698896, + "et": 0.0005480361869558692, + "mk": 0.0001639087568037212, + "br": 0.001776006305590272, + "eu": 0.001264306134544313, + "is": 0.0007374632405117154, + "hy": 0.00030862365383654833, + "ne": 0.00043864260078407824, + "mn": 0.0007520083454437554, + "bs": 0.0013617111835628748, + "kk": 8.570168574806303e-05, + "sq": 0.0002609043149277568, + "sw": 0.001304439501836896, + "gl": 0.004827686119824648, + "mr": 0.00020801107166334987, + "pa": 0.0009395524975843728, + "si": 0.0011830752482637763, + "km": 0.0007260299171321094, + "sn": 0.001996817532926798, + "yo": 0.0009035589173436165, + "so": 4.6595199819421396e-05, + "af": 0.0001509998255642131, + "oc": 0.00048175465781241655, + "ka": 0.00022316329705063254, + "be": 0.000393196678487584, + "tg": 3.2651128094585147e-06, + "sd": 0.002860309323295951, + "gu": 0.00046876014675945044, + "am": 8.241849718615413e-05, + "yi": 0.0008259196765720844, + "lo": 7.160643872339278e-05, + "uz": 4.3158429718914704e-08, + "fo": 0.0010941657237708569, + "ht": 0.001555123133584857, + "ps": 0.0002712975547183305, + "tk": 3.5393944131101307e-07, + "nn": 0.007959508337080479, + "mt": 0.0004912564181722701, + "sa": 0.0012892422964796424, + "lb": 7.492898248528945e-07, + "my": 0.00042348948772996664, + "bo": 0.0012398521648719907, + "tl": 0.011401468887925148, + "mg": 4.178579331437504e-07, + "as": 0.0001984855334740132, + "tt": 1.6100466382340528e-06, + "haw": 0.004535190761089325, + "ln": 8.082438580458984e-05, + "ha": 7.570124580524862e-07, + "ba": 2.531344307499239e-07, + "jw": 0.010300369001924992, + "su": 1.0605447187117534e-06 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/laugh2.mp3.words.json b/tests/expected/tiny_auto/laugh2.mp3.words.json 
new file mode 100644 index 0000000000000000000000000000000000000000..5404314b300353b004f212ff9f0f0b9b3bb91c35 --- /dev/null +++ b/tests/expected/tiny_auto/laugh2.mp3.words.json @@ -0,0 +1,133 @@ +{ + "text": " Haha.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.18, + "end": 0.56, + "text": " Haha.", + "tokens": [ + 50364, + 19131, + 13, + 50401 + ], + "temperature": 0.0, + "avg_logprob": -1.316188430786133, + "compression_ratio": 0.38461538461538464, + "no_speech_prob": 0.5721203088760376, + "confidence": 0.079, + "words": [ + { + "text": "Haha.", + "start": 0.18, + "end": 0.56, + "confidence": 0.079 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.6548641920089722, + "zh": 0.038717932999134064, + "de": 0.025590991601347923, + "es": 0.011994256637990475, + "ru": 0.011355933733284473, + "ko": 0.04633929580450058, + "fr": 0.02422906644642353, + "ja": 0.014243531040847301, + "pt": 0.019468599930405617, + "tr": 0.0092684431001544, + "pl": 0.007989896461367607, + "ca": 0.0003766233567148447, + "nl": 0.02767045982182026, + "ar": 0.0034096697345376015, + "sv": 0.004660465754568577, + "it": 0.0023070976603776217, + "id": 0.0032282101456075907, + "hi": 0.019166767597198486, + "fi": 0.00038405158556997776, + "vi": 0.0028937491588294506, + "he": 0.0006482097669504583, + "uk": 0.0007608000887557864, + "el": 0.0010562663665041327, + "ms": 0.0037156471516937017, + "cs": 0.0018179493490606546, + "ro": 0.003383135423064232, + "da": 0.001361581147648394, + "hu": 0.001269133179448545, + "ta": 0.0015980799216777086, + "no": 0.0012741003884002566, + "th": 0.00850520096719265, + "ur": 0.002117111813277006, + "hr": 0.0002384630497545004, + "bg": 0.00032088710577227175, + "lt": 0.00015098540461622179, + "la": 0.001875657238997519, + "mi": 0.0015489121433347464, + "ml": 0.001011841231957078, + "cy": 0.01327643170952797, + "sk": 0.0001626176672289148, + "te": 0.0011112901847809553, + "fa": 0.0003551896952558309, + "lv": 0.00010540479706833139, + "bn": 
0.0016813284019008279, + "sr": 9.122024493990466e-05, + "az": 9.979525930248201e-05, + "sl": 0.0002431663015158847, + "kn": 2.787499215628486e-05, + "et": 4.0085364162223414e-05, + "mk": 3.091512917308137e-05, + "br": 0.0008587384945712984, + "eu": 0.00010057795589091256, + "is": 0.00015577819431200624, + "hy": 0.00014748783723916858, + "ne": 0.00018141313921660185, + "mn": 0.0002681112091522664, + "bs": 0.0002431663015158847, + "kk": 2.7335841878084466e-05, + "sq": 6.172270514070988e-05, + "sw": 0.00029909968725405633, + "gl": 0.0007259605336003006, + "mr": 0.00017310561088379472, + "pa": 8.081665873760357e-05, + "si": 0.0005147830815985799, + "km": 0.0007637778180651367, + "sn": 0.000816219428088516, + "yo": 0.00030619261087849736, + "so": 3.4114727895939723e-06, + "af": 4.6590746933361515e-05, + "oc": 0.00016325415344908834, + "ka": 4.385352076496929e-05, + "be": 7.833019481040537e-05, + "tg": 2.4760939254520054e-07, + "sd": 0.00022054229339119047, + "gu": 8.875974162947387e-05, + "am": 1.856874951045029e-05, + "yi": 0.00012468329805415124, + "lo": 5.362561932997778e-05, + "uz": 3.726850383856117e-09, + "fo": 0.00023022523964755237, + "ht": 0.0003962427144870162, + "ps": 4.604794958140701e-05, + "tk": 2.9428679937382185e-08, + "nn": 0.00637010158970952, + "mt": 3.388737604836933e-05, + "sa": 0.00042015372309833765, + "lb": 1.55556463710127e-07, + "my": 0.00015885064203757793, + "bo": 0.0005587917985394597, + "tl": 0.0009579920442774892, + "mg": 3.7639857453086734e-08, + "as": 4.351224924903363e-05, + "tt": 1.580061166350788e-07, + "haw": 0.0029623722657561302, + "ln": 1.3479466360877268e-05, + "ha": 5.124700308556385e-08, + "ba": 2.5718332352653306e-08, + "jw": 0.0032030881848186255, + "su": 1.0352179913297732e-07 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/punctuations.mp3.words.json b/tests/expected/tiny_auto/punctuations.mp3.words.json new file mode 100644 index 
0000000000000000000000000000000000000000..2d18126b77ff7c4b54b4a194d6fce0742720f8be --- /dev/null +++ b/tests/expected/tiny_auto/punctuations.mp3.words.json @@ -0,0 +1,172 @@ +{ + "text": " Dima, est ce que l'on vole ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 2.58, + "text": " Dima, est ce que l'on vole ?", + "tokens": [ + 50364, + 413, + 4775, + 11, + 871, + 1769, + 631, + 287, + 6, + 266, + 49877, + 2506, + 50494 + ], + "temperature": 0.0, + "avg_logprob": -0.8432660784040179, + "compression_ratio": 0.7777777777777778, + "no_speech_prob": 0.0010773586109280586, + "confidence": 0.456, + "words": [ + { + "text": "Dima,", + "start": 0.42, + "end": 0.84, + "confidence": 0.247 + }, + { + "text": "est", + "start": 1.2, + "end": 1.4, + "confidence": 0.93 + }, + { + "text": "ce", + "start": 1.4, + "end": 1.56, + "confidence": 0.587 + }, + { + "text": "que", + "start": 1.56, + "end": 1.68, + "confidence": 0.916 + }, + { + "text": "l'on", + "start": 1.68, + "end": 2.02, + "confidence": 0.481 + }, + { + "text": "vole ?", + "start": 2.02, + "end": 2.58, + "confidence": 0.249 + } + ] + } + ], + "language": "fr", + "language_probs": { + "en": 0.0004427048552315682, + "zh": 4.150092354393564e-05, + "de": 8.062254346441478e-05, + "es": 2.3646514819120057e-05, + "ru": 2.6379595510661602e-05, + "ko": 3.101747779510333e-06, + "fr": 0.988398015499115, + "ja": 9.801208216231316e-05, + "pt": 0.001104298629797995, + "tr": 4.841759619012009e-06, + "pl": 1.2756338037434034e-05, + "ca": 6.920935220477986e-07, + "nl": 4.487320256885141e-05, + "ar": 7.114913751138374e-05, + "sv": 2.070558002742473e-05, + "it": 0.001104298629797995, + "id": 8.380914664485317e-07, + "hi": 1.2980614201296703e-06, + "fi": 7.67460761608163e-08, + "vi": 1.0109312142958515e-06, + "he": 0.00013501734065357596, + "uk": 1.5262780550528987e-07, + "el": 2.2388070647139102e-05, + "ms": 2.1869453121325932e-05, + "cs": 2.8241736345080426e-06, + "ro": 1.1890214409504551e-05, + "da": 
2.891146777983522e-06, + "hu": 5.8402770264365245e-06, + "ta": 6.398907625992933e-09, + "no": 5.306464458953997e-07, + "th": 1.6217863958445378e-06, + "ur": 1.8377247670287034e-06, + "hr": 1.6565119054234856e-08, + "bg": 3.9280556052290194e-07, + "lt": 1.0570640363027906e-08, + "la": 0.0002483348944224417, + "mi": 3.647076312063291e-07, + "ml": 9.549777857387198e-09, + "cy": 1.612552114238497e-05, + "sk": 1.099336799370576e-07, + "te": 1.5392920271750654e-09, + "fa": 8.348240498889936e-07, + "lv": 1.160957729950951e-08, + "bn": 2.7854085260514694e-07, + "sr": 2.6419332499472148e-08, + "az": 8.428907705138045e-08, + "sl": 1.6473258028781856e-06, + "kn": 9.501843756254402e-10, + "et": 2.3914541458225358e-08, + "mk": 7.015159297907303e-08, + "br": 0.006159283686429262, + "eu": 5.074120508652413e-06, + "is": 4.916538287602634e-08, + "hy": 1.4967571360102738e-07, + "ne": 3.332702558367373e-09, + "mn": 5.39976134916742e-08, + "bs": 3.017182592657264e-08, + "kk": 4.051535995586164e-09, + "sq": 8.852010751070338e-07, + "sw": 8.512894851264718e-07, + "gl": 2.0225936168571934e-05, + "mr": 4.171988976509056e-09, + "pa": 1.5442691392308916e-07, + "si": 4.0212069052358856e-07, + "km": 4.5211646693132934e-07, + "sn": 9.78062416834291e-06, + "yo": 3.778702375711873e-05, + "so": 3.365910217212331e-08, + "af": 1.2073853383753885e-07, + "oc": 0.0013851008843630552, + "ka": 9.43992901625279e-08, + "be": 3.1317190973823017e-07, + "tg": 5.346487252921861e-09, + "sd": 8.413717296207324e-07, + "gu": 1.0570640363027906e-08, + "am": 3.2879388101036966e-08, + "yi": 6.464596935984446e-06, + "lo": 3.0235324288696575e-07, + "uz": 7.551113380410701e-12, + "fo": 1.4766532103749341e-06, + "ht": 0.00015419464034494013, + "ps": 1.3681467692094884e-07, + "tk": 1.9360801850609732e-10, + "nn": 8.1254867836833e-05, + "mt": 3.9127417039708234e-07, + "sa": 1.975150354383004e-07, + "lb": 5.274675629607373e-08, + "my": 1.925918923006975e-06, + "bo": 1.5870780600835133e-07, + "tl": 5.953688742010854e-08, + 
"mg": 8.492480607635855e-10, + "as": 5.976990280487371e-08, + "tt": 1.1517511389058654e-09, + "haw": 0.00011458773951744661, + "ln": 5.761833017459139e-05, + "ha": 8.982996013706668e-10, + "ba": 3.282146221472715e-10, + "jw": 3.3276894555456238e-06, + "su": 2.5238919287851047e-10 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_auto/radio_short.mp3.words.json b/tests/expected/tiny_auto/radio_short.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..a10f3dc9d16b9207b21ee7c2bbba0081024b834a --- /dev/null +++ b/tests/expected/tiny_auto/radio_short.mp3.words.json @@ -0,0 +1,2934 @@ +{ + "text": " What are you telling me, guys? What are you telling me, dude? What are you telling me, dude? What are you telling me, dude? What are you telling me, guys? What are you telling me, guys? What are you telling me, dude? What are you telling me, dude? The most important thing is not to be alert. It's what you do. Yes, man. The reference of the book. Good evening, good evening. All of you, this is your BFFM TV. It's called the BFFM story with the actuality. There are 60 minutes of the report of the analysis of the actions you need. As you can see, it's a bit of a report of the reports of the reports. So, what is it, guys? So, we are ready to do it. The report is ready to be told by the leaders of the CFT's CFT's CFT's CFT. 
The report of the CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's C The CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's C", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 5.0, + "end": 6.12, + "text": " What are you telling me, guys?", + "tokens": [ + 50364, + 708, + 366, + 291, + 3585, + 385, + 11, + 1074, + 30, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.342, + "words": [ + { + "text": "What", + "start": 5.0, + "end": 5.22, + "confidence": 0.041 + }, + { + "text": "are", + "start": 5.22, + "end": 5.3, + "confidence": 0.602 + }, + { + "text": "you", + "start": 5.3, + "end": 5.46, + "confidence": 0.97 + }, + { + "text": "telling", + "start": 5.46, + "end": 5.7, + "confidence": 0.355 + }, + { + "text": "me,", + "start": 5.7, + "end": 5.94, + "confidence": 0.612 + }, + { + "text": "guys?", + "start": 6.02, + "end": 6.12, + "confidence": 0.304 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 6.76, + "end": 7.57, + "text": " What are you telling me, dude?", + "tokens": [ + 50664, + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30, + 50764 + ], + "temperature": 0.0, + 
"avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.677, + "words": [ + { + "text": "What", + "start": 6.76, + "end": 6.92, + "confidence": 0.884 + }, + { + "text": "are", + "start": 6.92, + "end": 7.06, + "confidence": 0.936 + }, + { + "text": "you", + "start": 7.06, + "end": 7.18, + "confidence": 0.993 + }, + { + "text": "telling", + "start": 7.18, + "end": 7.3, + "confidence": 0.906 + }, + { + "text": "me,", + "start": 7.3, + "end": 7.44, + "confidence": 0.984 + }, + { + "text": "dude?", + "start": 7.48, + "end": 7.57, + "confidence": 0.132 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 7.57, + "end": 9.36, + "text": " What are you telling me, dude?", + "tokens": [ + 50764, + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.826, + "words": [ + { + "text": "What", + "start": 7.57, + "end": 9.12, + "confidence": 0.544 + }, + { + "text": "are", + "start": 9.12, + "end": 9.28, + "confidence": 0.852 + }, + { + "text": "you", + "start": 9.28, + "end": 9.3, + "confidence": 0.994 + }, + { + "text": "telling", + "start": 9.3, + "end": 9.32, + "confidence": 0.849 + }, + { + "text": "me,", + "start": 9.32, + "end": 9.34, + "confidence": 0.951 + }, + { + "text": "dude?", + "start": 9.34, + "end": 9.36, + "confidence": 0.855 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 11.22, + "end": 12.5, + "text": " What are you telling me, dude?", + "tokens": [ + 50864, + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30, + 50964 + ], + "temperature": 0.0, + "avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.774, + "words": [ + { + "text": "What", + "start": 11.22, + "end": 11.44, + "confidence": 0.423 + }, + { + "text": "are", + 
"start": 11.44, + "end": 11.56, + "confidence": 0.791 + }, + { + "text": "you", + "start": 11.56, + "end": 11.68, + "confidence": 0.994 + }, + { + "text": "telling", + "start": 11.68, + "end": 11.7, + "confidence": 0.809 + }, + { + "text": "me,", + "start": 11.7, + "end": 12.48, + "confidence": 0.956 + }, + { + "text": "dude?", + "start": 12.48, + "end": 12.5, + "confidence": 0.837 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 12.5, + "end": 13.54, + "text": " What are you telling me, guys?", + "tokens": [ + 50964, + 708, + 366, + 291, + 3585, + 385, + 11, + 1074, + 30, + 51164 + ], + "temperature": 0.0, + "avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.76, + "words": [ + { + "text": "What", + "start": 12.5, + "end": 12.52, + "confidence": 0.504 + }, + { + "text": "are", + "start": 12.52, + "end": 12.54, + "confidence": 0.845 + }, + { + "text": "you", + "start": 12.54, + "end": 12.64, + "confidence": 0.994 + }, + { + "text": "telling", + "start": 12.64, + "end": 12.66, + "confidence": 0.844 + }, + { + "text": "me,", + "start": 12.66, + "end": 13.04, + "confidence": 0.962 + }, + { + "text": "guys?", + "start": 13.52, + "end": 13.54, + "confidence": 0.563 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 20.32, + "end": 21.4, + "text": " What are you telling me, guys?", + "tokens": [ + 51164, + 708, + 366, + 291, + 3585, + 385, + 11, + 1074, + 30, + 51414 + ], + "temperature": 0.0, + "avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.935, + "words": [ + { + "text": "What", + "start": 20.32, + "end": 20.72, + "confidence": 0.885 + }, + { + "text": "are", + "start": 20.72, + "end": 20.78, + "confidence": 0.936 + }, + { + "text": "you", + "start": 20.78, + "end": 20.8, + "confidence": 0.996 + }, + { + "text": "telling", + "start": 20.8, + "end": 21.04, + "confidence": 0.935 + }, + { + 
"text": "me,", + "start": 21.04, + "end": 21.3, + "confidence": 0.896 + }, + { + "text": "guys?", + "start": 21.38, + "end": 21.4, + "confidence": 0.969 + } + ] + }, + { + "id": 6, + "seek": 0, + "start": 22.08, + "end": 22.96, + "text": " What are you telling me, dude?", + "tokens": [ + 51414, + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30, + 51514 + ], + "temperature": 0.0, + "avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.953, + "words": [ + { + "text": "What", + "start": 22.08, + "end": 22.24, + "confidence": 0.95 + }, + { + "text": "are", + "start": 22.24, + "end": 22.36, + "confidence": 0.965 + }, + { + "text": "you", + "start": 22.36, + "end": 22.44, + "confidence": 0.997 + }, + { + "text": "telling", + "start": 22.44, + "end": 22.6, + "confidence": 0.864 + }, + { + "text": "me,", + "start": 22.6, + "end": 22.78, + "confidence": 0.984 + }, + { + "text": "dude?", + "start": 22.94, + "end": 22.96, + "confidence": 0.967 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 22.96, + "end": 23.08, + "text": " What are you telling me, dude?", + "tokens": [ + 51514, + 708, + 366, + 291, + 3585, + 385, + 11, + 6449, + 30, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.39804049236018485, + "compression_ratio": 4.660377358490566, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.856, + "words": [ + { + "text": "What", + "start": 22.96, + "end": 22.98, + "confidence": 0.541 + }, + { + "text": "are", + "start": 22.98, + "end": 23.0, + "confidence": 0.889 + }, + { + "text": "you", + "start": 23.0, + "end": 23.02, + "confidence": 0.996 + }, + { + "text": "telling", + "start": 23.02, + "end": 23.04, + "confidence": 0.882 + }, + { + "text": "me,", + "start": 23.04, + "end": 23.06, + "confidence": 0.975 + }, + { + "text": "dude?", + "start": 23.06, + "end": 23.08, + "confidence": 0.955 + } + ] + }, + { + "id": 8, + "seek": 2600, + "start": 26.54, + "end": 32.48, + 
"text": " The most important thing is not to be alert.", + "tokens": [ + 50414, + 440, + 881, + 1021, + 551, + 307, + 406, + 281, + 312, + 9615, + 13, + 50664 + ], + "temperature": 0.0, + "avg_logprob": -0.9188781111207727, + "compression_ratio": 1.3594771241830066, + "no_speech_prob": 0.09051438421010971, + "confidence": 0.276, + "words": [ + { + "text": "The", + "start": 26.54, + "end": 31.02, + "confidence": 0.182 + }, + { + "text": "most", + "start": 31.02, + "end": 31.18, + "confidence": 0.518 + }, + { + "text": "important", + "start": 31.18, + "end": 31.5, + "confidence": 0.995 + }, + { + "text": "thing", + "start": 31.5, + "end": 31.68, + "confidence": 0.217 + }, + { + "text": "is", + "start": 31.68, + "end": 31.9, + "confidence": 0.507 + }, + { + "text": "not", + "start": 31.9, + "end": 32.22, + "confidence": 0.284 + }, + { + "text": "to", + "start": 32.22, + "end": 32.4, + "confidence": 0.343 + }, + { + "text": "be", + "start": 32.4, + "end": 32.42, + "confidence": 0.247 + }, + { + "text": "alert.", + "start": 32.42, + "end": 32.48, + "confidence": 0.038 + } + ] + }, + { + "id": 9, + "seek": 2600, + "start": 33.42, + "end": 34.06, + "text": " It's what you do.", + "tokens": [ + 50664, + 467, + 311, + 437, + 291, + 360, + 13, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.9188781111207727, + "compression_ratio": 1.3594771241830066, + "no_speech_prob": 0.09051438421010971, + "confidence": 0.502, + "words": [ + { + "text": "It's", + "start": 33.42, + "end": 33.64, + "confidence": 0.307 + }, + { + "text": "what", + "start": 33.64, + "end": 33.72, + "confidence": 0.616 + }, + { + "text": "you", + "start": 33.72, + "end": 33.88, + "confidence": 0.898 + }, + { + "text": "do.", + "start": 33.88, + "end": 34.06, + "confidence": 0.614 + } + ] + }, + { + "id": 10, + "seek": 2600, + "start": 34.86, + "end": 35.5, + "text": " Yes, man.", + "tokens": [ + 50764, + 1079, + 11, + 587, + 13, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.9188781111207727, + 
"compression_ratio": 1.3594771241830066, + "no_speech_prob": 0.09051438421010971, + "confidence": 0.088, + "words": [ + { + "text": "Yes,", + "start": 34.86, + "end": 34.88, + "confidence": 0.065 + }, + { + "text": "man.", + "start": 35.48, + "end": 35.5, + "confidence": 0.12 + } + ] + }, + { + "id": 11, + "seek": 2600, + "start": 37.14, + "end": 38.64, + "text": " The reference of the book.", + "tokens": [ + 50864, + 440, + 6408, + 295, + 264, + 1446, + 13, + 51014 + ], + "temperature": 0.0, + "avg_logprob": -0.9188781111207727, + "compression_ratio": 1.3594771241830066, + "no_speech_prob": 0.09051438421010971, + "confidence": 0.268, + "words": [ + { + "text": "The", + "start": 37.14, + "end": 37.28, + "confidence": 0.385 + }, + { + "text": "reference", + "start": 37.28, + "end": 37.74, + "confidence": 0.543 + }, + { + "text": "of", + "start": 37.74, + "end": 37.92, + "confidence": 0.781 + }, + { + "text": "the", + "start": 37.92, + "end": 38.2, + "confidence": 0.37 + }, + { + "text": "book.", + "start": 38.2, + "end": 38.64, + "confidence": 0.023 + } + ] + }, + { + "id": 12, + "seek": 2600, + "start": 44.94, + "end": 45.65, + "text": " Good evening, good evening.", + "tokens": [ + 51264, + 2205, + 5634, + 11, + 665, + 5634, + 13, + 51364 + ], + "temperature": 0.0, + "avg_logprob": -0.9188781111207727, + "compression_ratio": 1.3594771241830066, + "no_speech_prob": 0.09051438421010971, + "confidence": 0.398, + "words": [ + { + "text": "Good", + "start": 44.94, + "end": 45.16, + "confidence": 0.134 + }, + { + "text": "evening,", + "start": 45.16, + "end": 45.4, + "confidence": 0.782 + }, + { + "text": "good", + "start": 45.46, + "end": 45.58, + "confidence": 0.328 + }, + { + "text": "evening.", + "start": 45.58, + "end": 45.65, + "confidence": 0.733 + } + ] + }, + { + "id": 13, + "seek": 2600, + "start": 45.65, + "end": 47.76, + "text": " All of you, this is your BFFM TV.", + "tokens": [ + 51364, + 1057, + 295, + 291, + 11, + 341, + 307, + 428, + 363, + 6345, + 44, 
+ 3558, + 13, + 51464 + ], + "temperature": 0.0, + "avg_logprob": -0.9188781111207727, + "compression_ratio": 1.3594771241830066, + "no_speech_prob": 0.09051438421010971, + "confidence": 0.327, + "words": [ + { + "text": "All", + "start": 45.65, + "end": 46.28, + "confidence": 0.146 + }, + { + "text": "of", + "start": 46.28, + "end": 46.3, + "confidence": 0.355 + }, + { + "text": "you,", + "start": 46.3, + "end": 46.5, + "confidence": 0.953 + }, + { + "text": "this", + "start": 46.54, + "end": 46.68, + "confidence": 0.226 + }, + { + "text": "is", + "start": 46.68, + "end": 46.82, + "confidence": 0.254 + }, + { + "text": "your", + "start": 46.82, + "end": 47.08, + "confidence": 0.184 + }, + { + "text": "BFFM", + "start": 47.08, + "end": 47.62, + "confidence": 0.326 + }, + { + "text": "TV.", + "start": 47.62, + "end": 47.76, + "confidence": 0.775 + } + ] + }, + { + "id": 14, + "seek": 2600, + "start": 47.76, + "end": 51.42, + "text": " It's called the BFFM story with the actuality.", + "tokens": [ + 51464, + 467, + 311, + 1219, + 264, + 363, + 6345, + 44, + 1657, + 365, + 264, + 3539, + 507, + 13, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.9188781111207727, + "compression_ratio": 1.3594771241830066, + "no_speech_prob": 0.09051438421010971, + "confidence": 0.385, + "words": [ + { + "text": "It's", + "start": 47.76, + "end": 48.22, + "confidence": 0.351 + }, + { + "text": "called", + "start": 48.22, + "end": 48.38, + "confidence": 0.215 + }, + { + "text": "the", + "start": 48.38, + "end": 48.72, + "confidence": 0.207 + }, + { + "text": "BFFM", + "start": 48.72, + "end": 49.8, + "confidence": 0.849 + }, + { + "text": "story", + "start": 49.8, + "end": 50.06, + "confidence": 0.467 + }, + { + "text": "with", + "start": 50.06, + "end": 50.22, + "confidence": 0.368 + }, + { + "text": "the", + "start": 50.22, + "end": 50.66, + "confidence": 0.179 + }, + { + "text": "actuality.", + "start": 50.66, + "end": 51.42, + "confidence": 0.322 + } + ] + }, + { + "id": 15, 
+ "seek": 5200, + "start": 52.0, + "end": 56.02, + "text": " There are 60 minutes of the report of the analysis of the actions you need.", + "tokens": [ + 50364, + 821, + 366, + 4060, + 2077, + 295, + 264, + 2275, + 295, + 264, + 5215, + 295, + 264, + 5909, + 291, + 643, + 13, + 50564 + ], + "temperature": 0.0, + "avg_logprob": -0.4928334554036458, + "compression_ratio": 3.419753086419753, + "no_speech_prob": 0.2597074508666992, + "confidence": 0.299, + "words": [ + { + "text": "There", + "start": 52.0, + "end": 52.16, + "confidence": 0.088 + }, + { + "text": "are", + "start": 52.16, + "end": 52.3, + "confidence": 0.683 + }, + { + "text": "60", + "start": 52.3, + "end": 52.7, + "confidence": 0.201 + }, + { + "text": "minutes", + "start": 52.7, + "end": 53.12, + "confidence": 0.804 + }, + { + "text": "of", + "start": 53.12, + "end": 53.74, + "confidence": 0.217 + }, + { + "text": "the", + "start": 53.74, + "end": 53.86, + "confidence": 0.16 + }, + { + "text": "report", + "start": 53.86, + "end": 54.16, + "confidence": 0.072 + }, + { + "text": "of", + "start": 54.16, + "end": 54.4, + "confidence": 0.56 + }, + { + "text": "the", + "start": 54.4, + "end": 54.52, + "confidence": 0.584 + }, + { + "text": "analysis", + "start": 54.52, + "end": 54.7, + "confidence": 0.128 + }, + { + "text": "of", + "start": 54.7, + "end": 54.82, + "confidence": 0.838 + }, + { + "text": "the", + "start": 54.82, + "end": 55.22, + "confidence": 0.549 + }, + { + "text": "actions", + "start": 55.22, + "end": 55.24, + "confidence": 0.321 + }, + { + "text": "you", + "start": 55.24, + "end": 55.66, + "confidence": 0.557 + }, + { + "text": "need.", + "start": 55.66, + "end": 56.02, + "confidence": 0.163 + } + ] + }, + { + "id": 16, + "seek": 5200, + "start": 56.7, + "end": 59.8, + "text": " As you can see, it's a bit of a report of the reports of the reports.", + "tokens": [ + 50564, + 1018, + 291, + 393, + 536, + 11, + 309, + 311, + 257, + 857, + 295, + 257, + 2275, + 295, + 264, + 7122, + 295, + 
264, + 7122, + 13, + 50764 + ], + "temperature": 0.0, + "avg_logprob": -0.4928334554036458, + "compression_ratio": 3.419753086419753, + "no_speech_prob": 0.2597074508666992, + "confidence": 0.287, + "words": [ + { + "text": "As", + "start": 56.7, + "end": 56.9, + "confidence": 0.289 + }, + { + "text": "you", + "start": 56.9, + "end": 56.96, + "confidence": 0.158 + }, + { + "text": "can", + "start": 56.96, + "end": 57.34, + "confidence": 0.266 + }, + { + "text": "see,", + "start": 57.34, + "end": 57.36, + "confidence": 0.922 + }, + { + "text": "it's", + "start": 57.64, + "end": 57.66, + "confidence": 0.309 + }, + { + "text": "a", + "start": 57.66, + "end": 57.68, + "confidence": 0.456 + }, + { + "text": "bit", + "start": 57.68, + "end": 57.7, + "confidence": 0.491 + }, + { + "text": "of", + "start": 57.7, + "end": 57.96, + "confidence": 0.106 + }, + { + "text": "a", + "start": 57.96, + "end": 58.1, + "confidence": 0.441 + }, + { + "text": "report", + "start": 58.1, + "end": 59.06, + "confidence": 0.058 + }, + { + "text": "of", + "start": 59.06, + "end": 59.32, + "confidence": 0.53 + }, + { + "text": "the", + "start": 59.32, + "end": 59.46, + "confidence": 0.706 + }, + { + "text": "reports", + "start": 59.46, + "end": 59.72, + "confidence": 0.095 + }, + { + "text": "of", + "start": 59.72, + "end": 59.76, + "confidence": 0.291 + }, + { + "text": "the", + "start": 59.76, + "end": 59.78, + "confidence": 0.746 + }, + { + "text": "reports.", + "start": 59.78, + "end": 59.8, + "confidence": 0.123 + } + ] + }, + { + "id": 17, + "seek": 5200, + "start": 59.8, + "end": 60.62, + "text": " So, what is it, guys?", + "tokens": [ + 50764, + 407, + 11, + 437, + 307, + 309, + 11, + 1074, + 30, + 50814 + ], + "temperature": 0.0, + "avg_logprob": -0.4928334554036458, + "compression_ratio": 3.419753086419753, + "no_speech_prob": 0.2597074508666992, + "confidence": 0.234, + "words": [ + { + "text": "So,", + "start": 59.8, + "end": 60.02, + "confidence": 0.153 + }, + { + "text": "what", 
+ "start": 60.18, + "end": 60.2, + "confidence": 0.266 + }, + { + "text": "is", + "start": 60.2, + "end": 60.42, + "confidence": 0.34 + }, + { + "text": "it,", + "start": 60.42, + "end": 60.58, + "confidence": 0.189 + }, + { + "text": "guys?", + "start": 60.58, + "end": 60.62, + "confidence": 0.267 + } + ] + }, + { + "id": 18, + "seek": 5200, + "start": 60.62, + "end": 62.98, + "text": " So, we are ready to do it.", + "tokens": [ + 50814, + 407, + 11, + 321, + 366, + 1919, + 281, + 360, + 309, + 13, + 50914 + ], + "temperature": 0.0, + "avg_logprob": -0.4928334554036458, + "compression_ratio": 3.419753086419753, + "no_speech_prob": 0.2597074508666992, + "confidence": 0.393, + "words": [ + { + "text": "So,", + "start": 60.62, + "end": 62.06, + "confidence": 0.172 + }, + { + "text": "we", + "start": 62.08, + "end": 62.26, + "confidence": 0.36 + }, + { + "text": "are", + "start": 62.26, + "end": 62.44, + "confidence": 0.246 + }, + { + "text": "ready", + "start": 62.44, + "end": 62.68, + "confidence": 0.477 + }, + { + "text": "to", + "start": 62.68, + "end": 62.7, + "confidence": 0.886 + }, + { + "text": "do", + "start": 62.7, + "end": 62.92, + "confidence": 0.589 + }, + { + "text": "it.", + "start": 62.92, + "end": 62.98, + "confidence": 0.381 + } + ] + }, + { + "id": 19, + "seek": 5200, + "start": 63.0, + "end": 66.94, + "text": " The report is ready to be told by the leaders of the CFT's CFT's CFT's CFT.", + "tokens": [ + 50914, + 440, + 2275, + 307, + 1919, + 281, + 312, + 1907, + 538, + 264, + 3523, + 295, + 264, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 13, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.4928334554036458, + "compression_ratio": 3.419753086419753, + "no_speech_prob": 0.2597074508666992, + "confidence": 0.35, + "words": [ + { + "text": "The", + "start": 63.0, + "end": 63.44, + "confidence": 0.495 + }, + { + "text": "report", + "start": 63.44, + "end": 63.46, + "confidence": 0.387 + }, + { + 
"text": "is", + "start": 63.46, + "end": 63.62, + "confidence": 0.522 + }, + { + "text": "ready", + "start": 63.62, + "end": 63.88, + "confidence": 0.055 + }, + { + "text": "to", + "start": 63.88, + "end": 64.26, + "confidence": 0.458 + }, + { + "text": "be", + "start": 64.26, + "end": 64.68, + "confidence": 0.209 + }, + { + "text": "told", + "start": 64.68, + "end": 64.7, + "confidence": 0.047 + }, + { + "text": "by", + "start": 64.7, + "end": 65.04, + "confidence": 0.645 + }, + { + "text": "the", + "start": 65.04, + "end": 65.08, + "confidence": 0.891 + }, + { + "text": "leaders", + "start": 65.08, + "end": 65.46, + "confidence": 0.569 + }, + { + "text": "of", + "start": 65.46, + "end": 65.94, + "confidence": 0.835 + }, + { + "text": "the", + "start": 65.94, + "end": 66.02, + "confidence": 0.738 + }, + { + "text": "CFT's", + "start": 66.02, + "end": 66.36, + "confidence": 0.098 + }, + { + "text": "CFT's", + "start": 66.36, + "end": 66.62, + "confidence": 0.406 + }, + { + "text": "CFT's", + "start": 66.62, + "end": 66.64, + "confidence": 0.512 + }, + { + "text": "CFT.", + "start": 66.64, + "end": 66.94, + "confidence": 0.876 + } + ] + }, + { + "id": 20, + "seek": 6700, + "start": 67.0, + "end": 97.0, + "text": " The report of the CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's C", + "tokens": [ + 50364, + 440, + 2275, + 295, + 264, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, 
+ 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383 + ], + "temperature": 0.0, + "avg_logprob": -0.09771199932012857, + "compression_ratio": 13.264705882352942, + "no_speech_prob": 0.7763262987136841, + "confidence": 0.908, + "words": [ + { + "text": "The", + "start": 67.0, + "end": 67.84, + "confidence": 0.342 + }, + { + "text": "report", + "start": 67.84, + "end": 67.86, + "confidence": 0.626 + }, + { + "text": "of", + "start": 67.86, + "end": 68.16, + "confidence": 0.375 + }, + { + "text": "the", + "start": 68.16, + "end": 68.36, + "confidence": 0.865 + }, + { + "text": "CFT's", + "start": 68.36, + "end": 68.68, + "confidence": 0.859 + }, 
+ { + "text": "CFT's", + "start": 68.68, + "end": 68.82, + "confidence": 0.845 + }, + { + "text": "CFT's", + "start": 68.82, + "end": 68.94, + "confidence": 0.816 + }, + { + "text": "CFT's", + "start": 68.94, + "end": 69.04, + "confidence": 0.814 + }, + { + "text": "CFT's", + "start": 69.04, + "end": 69.24, + "confidence": 0.828 + }, + { + "text": "CFT's", + "start": 69.24, + "end": 69.64, + "confidence": 0.852 + }, + { + "text": "CFT's", + "start": 69.64, + "end": 69.88, + "confidence": 0.881 + }, + { + "text": "CFT's", + "start": 69.88, + "end": 70.34, + "confidence": 0.888 + }, + { + "text": "CFT's", + "start": 70.34, + "end": 70.92, + "confidence": 0.899 + }, + { + "text": "CFT's", + "start": 70.92, + "end": 71.62, + "confidence": 0.9 + }, + { + "text": "CFT's", + "start": 71.62, + "end": 73.26, + "confidence": 0.897 + }, + { + "text": "CFT's", + "start": 73.26, + "end": 74.0, + "confidence": 0.9 + }, + { + "text": "CFT's", + "start": 74.0, + "end": 74.4, + "confidence": 0.9 + }, + { + "text": "CFT's", + "start": 74.4, + "end": 74.96, + "confidence": 0.902 + }, + { + "text": "CFT's", + "start": 74.96, + "end": 76.3, + "confidence": 0.904 + }, + { + "text": "CFT's", + "start": 76.3, + "end": 76.32, + "confidence": 0.902 + }, + { + "text": "CFT's", + "start": 76.32, + "end": 76.38, + "confidence": 0.9 + }, + { + "text": "CFT's", + "start": 76.38, + "end": 76.5, + "confidence": 0.904 + }, + { + "text": "CFT's", + "start": 76.5, + "end": 77.4, + "confidence": 0.901 + }, + { + "text": "CFT's", + "start": 77.4, + "end": 77.42, + "confidence": 0.901 + }, + { + "text": "CFT's", + "start": 77.42, + "end": 78.0, + "confidence": 0.899 + }, + { + "text": "CFT's", + "start": 78.0, + "end": 78.02, + "confidence": 0.899 + }, + { + "text": "CFT's", + "start": 78.02, + "end": 78.06, + "confidence": 0.902 + }, + { + "text": "CFT's", + "start": 78.06, + "end": 78.08, + "confidence": 0.903 + }, + { + "text": "CFT's", + "start": 78.08, + "end": 78.1, + "confidence": 0.902 + }, + { 
+ "text": "CFT's", + "start": 78.1, + "end": 78.98, + "confidence": 0.904 + }, + { + "text": "CFT's", + "start": 78.98, + "end": 79.24, + "confidence": 0.903 + }, + { + "text": "CFT's", + "start": 79.24, + "end": 81.7, + "confidence": 0.906 + }, + { + "text": "CFT's", + "start": 81.7, + "end": 81.72, + "confidence": 0.906 + }, + { + "text": "CFT's", + "start": 81.72, + "end": 81.94, + "confidence": 0.91 + }, + { + "text": "CFT's", + "start": 81.94, + "end": 82.32, + "confidence": 0.916 + }, + { + "text": "CFT's", + "start": 82.32, + "end": 82.34, + "confidence": 0.916 + }, + { + "text": "CFT's", + "start": 82.34, + "end": 82.36, + "confidence": 0.916 + }, + { + "text": "CFT's", + "start": 82.36, + "end": 82.44, + "confidence": 0.919 + }, + { + "text": "CFT's", + "start": 82.44, + "end": 82.54, + "confidence": 0.918 + }, + { + "text": "CFT's", + "start": 82.54, + "end": 82.56, + "confidence": 0.923 + }, + { + "text": "CFT's", + "start": 82.56, + "end": 82.58, + "confidence": 0.922 + }, + { + "text": "CFT's", + "start": 82.58, + "end": 82.6, + "confidence": 0.922 + }, + { + "text": "CFT's", + "start": 82.6, + "end": 82.62, + "confidence": 0.927 + }, + { + "text": "CFT's", + "start": 82.62, + "end": 82.68, + "confidence": 0.928 + }, + { + "text": "CFT's", + "start": 82.68, + "end": 83.12, + "confidence": 0.931 + }, + { + "text": "CFT's", + "start": 83.12, + "end": 83.24, + "confidence": 0.933 + }, + { + "text": "CFT's", + "start": 83.24, + "end": 83.54, + "confidence": 0.93 + }, + { + "text": "CFT's", + "start": 83.54, + "end": 83.56, + "confidence": 0.935 + }, + { + "text": "CFT's", + "start": 83.56, + "end": 83.58, + "confidence": 0.932 + }, + { + "text": "CFT's", + "start": 83.58, + "end": 83.7, + "confidence": 0.936 + }, + { + "text": "CFT's", + "start": 83.7, + "end": 83.72, + "confidence": 0.938 + }, + { + "text": "CFT's", + "start": 83.72, + "end": 83.74, + "confidence": 0.94 + }, + { + "text": "CFT's", + "start": 83.74, + "end": 83.76, + "confidence": 0.942 + 
}, + { + "text": "CFT's", + "start": 83.76, + "end": 83.78, + "confidence": 0.939 + }, + { + "text": "CFT's", + "start": 83.78, + "end": 84.02, + "confidence": 0.947 + }, + { + "text": "CFT's", + "start": 84.02, + "end": 84.04, + "confidence": 0.945 + }, + { + "text": "CFT's", + "start": 84.04, + "end": 84.28, + "confidence": 0.947 + }, + { + "text": "CFT's", + "start": 84.28, + "end": 84.4, + "confidence": 0.948 + }, + { + "text": "CFT's", + "start": 84.4, + "end": 84.54, + "confidence": 0.952 + }, + { + "text": "CFT's", + "start": 84.54, + "end": 84.56, + "confidence": 0.954 + }, + { + "text": "CFT's", + "start": 84.56, + "end": 84.58, + "confidence": 0.956 + }, + { + "text": "CFT's", + "start": 84.58, + "end": 85.02, + "confidence": 0.954 + }, + { + "text": "CFT's", + "start": 85.02, + "end": 85.98, + "confidence": 0.954 + }, + { + "text": "CFT's", + "start": 85.98, + "end": 86.62, + "confidence": 0.954 + }, + { + "text": "CFT's", + "start": 86.62, + "end": 86.8, + "confidence": 0.952 + }, + { + "text": "CFT's", + "start": 86.8, + "end": 87.28, + "confidence": 0.95 + }, + { + "text": "CFT's", + "start": 87.28, + "end": 87.58, + "confidence": 0.952 + }, + { + "text": "CFT's", + "start": 87.58, + "end": 87.66, + "confidence": 0.951 + }, + { + "text": "CFT's", + "start": 87.66, + "end": 87.68, + "confidence": 0.952 + }, + { + "text": "CFT's", + "start": 87.68, + "end": 87.7, + "confidence": 0.954 + }, + { + "text": "CFT's", + "start": 87.7, + "end": 88.84, + "confidence": 0.949 + }, + { + "text": "CFT's", + "start": 88.84, + "end": 88.86, + "confidence": 0.948 + }, + { + "text": "CFT's", + "start": 88.86, + "end": 89.2, + "confidence": 0.95 + }, + { + "text": "CFT's", + "start": 89.2, + "end": 90.42, + "confidence": 0.954 + }, + { + "text": "CFT's", + "start": 90.42, + "end": 90.82, + "confidence": 0.951 + }, + { + "text": "CFT's", + "start": 90.82, + "end": 96.98, + "confidence": 0.95 + }, + { + "text": "C", + "start": 96.98, + "end": 97.0, + "confidence": 0.974 + 
} + ] + }, + { + "id": 21, + "seek": 9700, + "start": 97.0, + "end": 127.0, + "text": " The CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's CFT's C", + "tokens": [ + 50364, + 440, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 
25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383, + 25469, + 311, + 383 + ], + "temperature": 0.0, + "avg_logprob": -0.046164204721493574, + "compression_ratio": 21.095238095238095, + "no_speech_prob": 0.1808893084526062, + "confidence": 0.955, + "words": [ + { + "text": "The", + "start": 97.0, + "end": 97.94, + "confidence": 0.245 + }, + { + "text": "CFT's", + "start": 97.94, + "end": 97.96, + "confidence": 0.471 + }, + { + "text": "CFT's", + "start": 97.96, + "end": 99.74, + "confidence": 0.915 + }, + { + "text": "CFT's", + "start": 99.74, + "end": 102.98, + "confidence": 0.915 + }, + { + "text": "CFT's", + "start": 102.98, + "end": 104.02, + "confidence": 0.918 + }, + { + "text": "CFT's", + "start": 104.02, + "end": 104.12, + "confidence": 0.93 + }, + { + "text": "CFT's", + "start": 104.12, + "end": 104.28, + "confidence": 0.94 + }, + { + "text": "CFT's", + "start": 104.28, + "end": 104.3, + "confidence": 0.95 + }, + { + "text": "CFT's", + "start": 104.3, + "end": 104.82, + "confidence": 0.96 + }, + { + "text": "CFT's", + "start": 104.82, + "end": 105.08, + "confidence": 0.965 + }, + { + "text": "CFT's", + "start": 105.08, + "end": 105.94, + "confidence": 0.967 + }, + { + "text": "CFT's", + "start": 105.94, + "end": 106.88, + "confidence": 0.969 + }, + { + "text": "CFT's", + "start": 106.88, + "end": 108.96, + "confidence": 0.97 + }, + { + "text": "CFT's", + "start": 108.96, + "end": 108.98, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 108.98, + "end": 109.06, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 109.06, + "end": 109.7, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 109.7, + "end": 109.72, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 109.72, + "end": 110.12, + "confidence": 0.97 + }, + { + "text": "CFT's", + "start": 
110.12, + "end": 110.44, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 110.44, + "end": 110.82, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 110.82, + "end": 110.84, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 110.84, + "end": 110.86, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 110.86, + "end": 110.88, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 110.88, + "end": 110.9, + "confidence": 0.972 + }, + { + "text": "CFT's", + "start": 110.9, + "end": 111.54, + "confidence": 0.972 + }, + { + "text": "CFT's", + "start": 111.54, + "end": 111.76, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 111.76, + "end": 111.78, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 111.78, + "end": 111.8, + "confidence": 0.971 + }, + { + "text": "CFT's", + "start": 111.8, + "end": 111.82, + "confidence": 0.972 + }, + { + "text": "CFT's", + "start": 111.82, + "end": 111.84, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 111.84, + "end": 111.86, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 111.86, + "end": 111.88, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 111.88, + "end": 111.9, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 111.9, + "end": 111.92, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 111.92, + "end": 111.94, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 111.94, + "end": 111.96, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 111.96, + "end": 111.98, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 111.98, + "end": 112.0, + "confidence": 0.976 + }, + { + "text": "CFT's", + "start": 112.0, + "end": 112.02, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 112.02, + "end": 112.04, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 112.04, + "end": 112.58, + "confidence": 0.977 + }, + { + "text": "CFT's", + "start": 112.58, + "end": 112.76, + 
"confidence": 0.976 + }, + { + "text": "CFT's", + "start": 112.76, + "end": 112.78, + "confidence": 0.978 + }, + { + "text": "CFT's", + "start": 112.78, + "end": 112.8, + "confidence": 0.978 + }, + { + "text": "CFT's", + "start": 112.8, + "end": 112.82, + "confidence": 0.977 + }, + { + "text": "CFT's", + "start": 112.82, + "end": 112.84, + "confidence": 0.979 + }, + { + "text": "CFT's", + "start": 112.84, + "end": 112.86, + "confidence": 0.978 + }, + { + "text": "CFT's", + "start": 112.86, + "end": 112.88, + "confidence": 0.978 + }, + { + "text": "CFT's", + "start": 112.88, + "end": 113.2, + "confidence": 0.979 + }, + { + "text": "CFT's", + "start": 113.2, + "end": 113.22, + "confidence": 0.978 + }, + { + "text": "CFT's", + "start": 113.22, + "end": 113.24, + "confidence": 0.978 + }, + { + "text": "CFT's", + "start": 113.24, + "end": 113.26, + "confidence": 0.977 + }, + { + "text": "CFT's", + "start": 113.26, + "end": 114.64, + "confidence": 0.979 + }, + { + "text": "CFT's", + "start": 114.64, + "end": 114.66, + "confidence": 0.977 + }, + { + "text": "CFT's", + "start": 114.66, + "end": 115.04, + "confidence": 0.977 + }, + { + "text": "CFT's", + "start": 115.04, + "end": 115.86, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 115.86, + "end": 116.02, + "confidence": 0.976 + }, + { + "text": "CFT's", + "start": 116.02, + "end": 118.04, + "confidence": 0.976 + }, + { + "text": "CFT's", + "start": 118.04, + "end": 118.24, + "confidence": 0.976 + }, + { + "text": "CFT's", + "start": 118.24, + "end": 120.92, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 120.92, + "end": 120.94, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 120.94, + "end": 121.06, + "confidence": 0.976 + }, + { + "text": "CFT's", + "start": 121.06, + "end": 121.08, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 121.08, + "end": 121.1, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 121.1, + "end": 122.26, + "confidence": 0.975 + }, + 
{ + "text": "CFT's", + "start": 122.26, + "end": 122.28, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 122.28, + "end": 122.3, + "confidence": 0.974 + }, + { + "text": "CFT's", + "start": 122.3, + "end": 122.32, + "confidence": 0.976 + }, + { + "text": "CFT's", + "start": 122.32, + "end": 122.34, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 122.34, + "end": 122.36, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 122.36, + "end": 122.38, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 122.38, + "end": 122.4, + "confidence": 0.975 + }, + { + "text": "CFT's", + "start": 122.4, + "end": 122.56, + "confidence": 0.973 + }, + { + "text": "CFT's", + "start": 122.56, + "end": 126.98, + "confidence": 0.972 + }, + { + "text": "C", + "start": 126.98, + "end": 127.0, + "confidence": 0.992 + } + ] + } + ], + "language": "en", + "language_probs": { + "en": 0.6579782962799072, + "zh": 0.05073783919215202, + "de": 0.003372770268470049, + "es": 0.008955760858952999, + "ru": 0.014423510059714317, + "ko": 0.011957507580518723, + "fr": 0.009168140590190887, + "ja": 0.05153684318065643, + "pt": 0.01365590374916792, + "tr": 0.0036184543278068304, + "pl": 0.002318068640306592, + "ca": 0.00034455020795576274, + "nl": 0.005965822376310825, + "ar": 0.0007181041873991489, + "sv": 0.0017634937539696693, + "it": 0.0032183199655264616, + "id": 0.0022643706761300564, + "hi": 0.00909679289907217, + "fi": 0.0007069710409268737, + "vi": 0.010470344685018063, + "he": 0.00012430129572749138, + "uk": 0.0007886832463555038, + "el": 0.00020413922902662307, + "ms": 0.004610029980540276, + "cs": 0.0006798874237574637, + "ro": 0.00173615338280797, + "da": 0.00031127515831030905, + "hu": 0.0025064300280064344, + "ta": 0.008955760858952999, + "no": 0.0006094471318647265, + "th": 0.0027100970037281513, + "ur": 0.000907768786419183, + "hr": 0.0001365182688459754, + "bg": 0.0006960105383768678, + "lt": 3.660014772322029e-05, + "la": 0.007720347959548235, + 
"mi": 0.0006487531354650855, + "ml": 0.00268900697119534, + "cy": 0.002318068640306592, + "sk": 0.00011953939247177914, + "te": 0.0032946402207016945, + "fa": 0.0002017609222093597, + "lv": 4.278990672901273e-05, + "bn": 0.00012975878780707717, + "sr": 4.4148200686322525e-05, + "az": 1.3783741451334208e-05, + "sl": 0.00034997606417164207, + "kn": 0.00013866812514606863, + "et": 4.329430157667957e-05, + "mk": 2.1017694962210953e-05, + "br": 0.0018194729927927256, + "eu": 0.0001441920321667567, + "is": 5.2222891099518165e-05, + "hy": 4.554961560643278e-05, + "ne": 0.00013975570618640631, + "mn": 0.0001553009351482615, + "bs": 0.00010715441749198362, + "kk": 5.928312930336688e-06, + "sq": 5.141325164004229e-05, + "sw": 6.0816717450506985e-05, + "gl": 0.000690594082698226, + "mr": 0.0001006622624117881, + "pa": 7.110193837434053e-05, + "si": 0.0003137165040243417, + "km": 0.0006693467148579657, + "sn": 0.00011273637937847525, + "yo": 0.0001277470582863316, + "so": 2.5547203676978825e-06, + "af": 5.8031713706441224e-05, + "oc": 4.2291387217119336e-05, + "ka": 1.008440085570328e-05, + "be": 2.5352179363835603e-05, + "tg": 1.1112863518292215e-07, + "sd": 0.00013812750694341958, + "gu": 0.0001318021968472749, + "am": 8.198559044103604e-06, + "yi": 5.848686851095408e-05, + "lo": 8.558519766665995e-06, + "uz": 2.218585981594856e-09, + "fo": 0.00011722728959284723, + "ht": 3.896065027220175e-05, + "ps": 1.9667322703753598e-05, + "tk": 2.7027908799936995e-08, + "nn": 0.04045173153281212, + "mt": 1.362315560982097e-05, + "sa": 0.00033394951606169343, + "lb": 7.04052212086026e-08, + "my": 0.00013231804769020528, + "bo": 7.480583735741675e-05, + "tl": 0.0008395488257519901, + "mg": 2.9800533596358036e-08, + "as": 1.531692578282673e-05, + "tt": 9.253462707192739e-08, + "haw": 0.04076899588108063, + "ln": 6.850153113191482e-06, + "ha": 5.209765774338848e-08, + "ba": 2.150648192866811e-08, + "jw": 0.006974753458052874, + "su": 8.510132687433725e-08 + } +} \ No newline at end of file 
diff --git a/tests/expected/tiny_auto/smartphone.mp3.words.json b/tests/expected/tiny_auto/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..94c4ca676fbb4401dd2052668ed22176a027ace8 --- /dev/null +++ b/tests/expected/tiny_auto/smartphone.mp3.words.json @@ -0,0 +1,5192 @@ +{ + "text": " C'est évidence que dit Nicolas, mais je me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière dans quelques interagues entraîne. Et il est d'ailleurs, c'est la photo c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces les grand-attachilles à été beaucoup très souvent mentionnées. Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs nous ont appris à piquer sur des icônes, sauf que, alors le smartphone ajoute le toucher, qui rend le contact plus direct, plus sensible. Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté tout flu de la navigation web pour aller directement en but. Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas, dit qu'il est très symbolablement inédit dans l'histoire de l'humanité. Mais ça s'assoulait d'une autre interrogation. Est-ce que le fait que cette objet soit inédit un d'huits que notre rapport a lui est aussi un rapport inédit ? Est-ce que le rapport qu'on a au sein de foi n'est comparable à celui qu'on entretenait à d'autres objectes techniques comme la voiture ou le téléphone ? Il n'y a pas d'équivalent. On s'est espèrent de nous voter dans la relation à l'objet. C'est facilement éterricion. Parce que la passion de l'utilisateur et ses affices a dépendance, cette objet d'un lieu en fait, une espèce de relation de médiation avec le monde qui rendent encore avec la maille de celles formes de rogeur. Donc, à objets inédits, rapport inédits. 
Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépendance et de rogeur. Bon, en vrai, il faudrait remonter très, très filmant tout l'histoire des objectes techniques et de leur infertion dans nos vieux pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas se trompe pas vraiment. Pour autant, je sache. Il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais, la dépense n'était pas du même mort, donc le rejet n'en plus n'était pas du même mort. On peut adorer sa bagnure. On a par besoin pour plein de choses. Et là, le soir, quand on va se coucher, on la laisse. On la pade en la main quand on est colis, qu'on n'a même pas au chiot. On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui. Continuellement avec son smartphone dans la main, comme c'était une sorte de estimateur extère de tomber de lâcher à l'éantrénée, ça m'a eu immédiate. Bon, je dis ça pour le mome, mais évidemment, va là, bon aussi. Donc, rapport immédiate d'accord. Mais pourquoi, à ton impression qu'on en sortira, j'amé? Et puis, il faut en remettre la faute sur les gens qui ont créé cette critique merveilleux et diabolique et diabolique par que merveilleux. Les économistes parlent de dépendance du santé. 
Ces vidéos, en fait, on est un santé qui a été étabis, un soit mon termine, en marchand dessus, soit des finissants débordes, des finissants, une signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 3.66, + "text": " C'est évidence que dit Nicolas, mais je me l'étais jamais formulé comme ça.", + "tokens": [ + 50364, + 383, + 6, + 377, + 20090, + 2778, + 631, + 6176, + 38268, + 11, + 2420, + 1506, + 385, + 287, + 6, + 22824, + 14540, + 49990, + 526, + 5173, + 2788, + 13, + 50545 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.709, + "words": [ + { + "text": "C'est", + "start": 0.42, + "end": 0.68, + "confidence": 0.849 + }, + { + "text": "évidence", + "start": 0.68, + "end": 0.94, + "confidence": 0.368 + }, + { + "text": "que", + "start": 0.94, + "end": 1.08, + "confidence": 0.883 + }, + { + "text": "dit", + "start": 1.08, + "end": 1.2, + "confidence": 0.343 + }, + { + "text": "Nicolas,", + "start": 1.2, + "end": 1.44, + "confidence": 0.921 + }, + { + "text": "mais", + "start": 1.88, + "end": 2.14, + "confidence": 0.914 + }, + { + "text": "je", + "start": 2.14, + "end": 2.26, + "confidence": 0.778 + }, + { + "text": "me", + "start": 2.26, + "end": 2.34, + "confidence": 0.954 + }, + { + "text": "l'étais", + "start": 2.34, + "end": 2.58, + "confidence": 0.72 + }, + { + "text": "jamais", + "start": 2.58, + "end": 2.86, + "confidence": 0.946 + }, + { + "text": "formulé", + "start": 2.86, + "end": 3.26, + "confidence": 0.53 + }, + { + "text": "comme", + "start": 3.26, + "end": 3.46, + "confidence": 0.968 + }, + { + "text": "ça.", + "start": 3.46, + "end": 3.66, + "confidence": 0.96 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 4.14, + "end": 8.9, + "text": " Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière", + "tokens": [ + 50545, + 8257, + 1956, + 3887, + 635, + 
3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 635, + 12713, + 2776, + 730, + 17290, + 3916, + 11, + 2420, + 635, + 22267, + 50806 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.789, + "words": [ + { + "text": "Ce", + "start": 4.14, + "end": 4.26, + "confidence": 0.392 + }, + { + "text": "qui", + "start": 4.26, + "end": 4.38, + "confidence": 0.94 + }, + { + "text": "fait", + "start": 4.38, + "end": 4.56, + "confidence": 0.732 + }, + { + "text": "la", + "start": 4.56, + "end": 4.72, + "confidence": 0.988 + }, + { + "text": "force", + "start": 4.72, + "end": 5.02, + "confidence": 0.93 + }, + { + "text": "du", + "start": 5.02, + "end": 5.2, + "confidence": 0.938 + }, + { + "text": "smartphone,", + "start": 5.2, + "end": 5.58, + "confidence": 0.909 + }, + { + "text": "c'est", + "start": 5.9, + "end": 6.2, + "confidence": 0.947 + }, + { + "text": "pas", + "start": 6.2, + "end": 6.26, + "confidence": 0.983 + }, + { + "text": "seulement", + "start": 6.26, + "end": 6.6, + "confidence": 0.993 + }, + { + "text": "la", + "start": 6.6, + "end": 6.8, + "confidence": 0.633 + }, + { + "text": "cumulation", + "start": 6.8, + "end": 7.34, + "confidence": 0.689 + }, + { + "text": "des", + "start": 7.34, + "end": 7.56, + "confidence": 0.792 + }, + { + "text": "fonctions,", + "start": 7.56, + "end": 8.14, + "confidence": 0.834 + }, + { + "text": "mais", + "start": 8.38, + "end": 8.5, + "confidence": 0.668 + }, + { + "text": "la", + "start": 8.5, + "end": 8.62, + "confidence": 0.719 + }, + { + "text": "manière", + "start": 8.62, + "end": 8.9, + "confidence": 0.498 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 8.9, + "end": 10.98, + "text": " dans quelques interagues entraîne.", + "tokens": [ + 50806, + 2680, + 16597, + 728, + 559, + 1247, + 22284, + 24741, + 13, + 50906 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + 
"compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.303, + "words": [ + { + "text": "dans", + "start": 8.9, + "end": 9.06, + "confidence": 0.284 + }, + { + "text": "quelques", + "start": 9.06, + "end": 9.28, + "confidence": 0.281 + }, + { + "text": "interagues", + "start": 9.28, + "end": 10.38, + "confidence": 0.246 + }, + { + "text": "entraîne.", + "start": 10.38, + "end": 10.98, + "confidence": 0.446 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 11.0, + "end": 12.96, + "text": " Et il est d'ailleurs, c'est la photo c'est hyper convaincant.", + "tokens": [ + 50906, + 3790, + 1930, + 871, + 274, + 6, + 19400, + 11, + 269, + 6, + 377, + 635, + 5052, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13, + 51006 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.63, + "words": [ + { + "text": "Et", + "start": 11.0, + "end": 11.12, + "confidence": 0.36 + }, + { + "text": "il", + "start": 11.12, + "end": 11.28, + "confidence": 0.144 + }, + { + "text": "est", + "start": 11.28, + "end": 11.38, + "confidence": 0.241 + }, + { + "text": "d'ailleurs,", + "start": 11.38, + "end": 11.6, + "confidence": 0.904 + }, + { + "text": "c'est", + "start": 11.7, + "end": 11.78, + "confidence": 0.886 + }, + { + "text": "la", + "start": 11.78, + "end": 11.8, + "confidence": 0.969 + }, + { + "text": "photo", + "start": 11.8, + "end": 12.02, + "confidence": 0.809 + }, + { + "text": "c'est", + "start": 12.02, + "end": 12.26, + "confidence": 0.785 + }, + { + "text": "hyper", + "start": 12.26, + "end": 12.46, + "confidence": 0.938 + }, + { + "text": "convaincant.", + "start": 12.46, + "end": 12.96, + "confidence": 0.51 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.3, + "end": 18.8, + "text": " Alors évidemment, il faudrait ajouter les interfaces les grand-attachilles à été beaucoup très souvent", + "tokens": [ + 
51006, + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 1512, + 2697, + 12, + 1591, + 608, + 14835, + 1531, + 8862, + 8796, + 5732, + 20847, + 51306 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.532, + "words": [ + { + "text": "Alors", + "start": 13.3, + "end": 13.56, + "confidence": 0.894 + }, + { + "text": "évidemment,", + "start": 13.56, + "end": 13.82, + "confidence": 0.778 + }, + { + "text": "il", + "start": 14.38, + "end": 14.4, + "confidence": 0.964 + }, + { + "text": "faudrait", + "start": 14.4, + "end": 14.76, + "confidence": 0.856 + }, + { + "text": "ajouter", + "start": 14.76, + "end": 15.38, + "confidence": 0.883 + }, + { + "text": "les", + "start": 15.38, + "end": 15.6, + "confidence": 0.934 + }, + { + "text": "interfaces", + "start": 15.6, + "end": 16.0, + "confidence": 0.38 + }, + { + "text": "les", + "start": 16.0, + "end": 16.5, + "confidence": 0.463 + }, + { + "text": "grand-attachilles", + "start": 16.5, + "end": 17.16, + "confidence": 0.213 + }, + { + "text": "à", + "start": 17.16, + "end": 17.32, + "confidence": 0.406 + }, + { + "text": "été", + "start": 17.32, + "end": 17.72, + "confidence": 0.894 + }, + { + "text": "beaucoup", + "start": 17.72, + "end": 18.28, + "confidence": 0.797 + }, + { + "text": "très", + "start": 18.28, + "end": 18.64, + "confidence": 0.493 + }, + { + "text": "souvent", + "start": 18.64, + "end": 18.8, + "confidence": 0.822 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 18.8, + "end": 19.84, + "text": " mentionnées.", + "tokens": [ + 51306, + 2152, + 77, + 6836, + 13, + 51356 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.626, + "words": [ + { + "text": "mentionnées.", + "start": 18.8, + "end": 19.84, + "confidence": 0.626 + } + ] + }, + { + 
"id": 6, + "seek": 0, + "start": 20.02, + "end": 23.58, + "text": " Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs", + "tokens": [ + 51356, + 6313, + 4428, + 11, + 1930, + 38694, + 8645, + 631, + 1512, + 1740, + 3324, + 6212, + 368, + 945, + 1567, + 17338, + 287, + 6, + 21210, + 11, + 1512, + 4792, + 13923, + 2156, + 51543 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.658, + "words": [ + { + "text": "Mais", + "start": 20.02, + "end": 20.26, + "confidence": 0.98 + }, + { + "text": "bon,", + "start": 20.26, + "end": 20.46, + "confidence": 0.568 + }, + { + "text": "il", + "start": 20.6, + "end": 20.68, + "confidence": 0.975 + }, + { + "text": "faudrait", + "start": 20.68, + "end": 20.78, + "confidence": 0.771 + }, + { + "text": "que", + "start": 20.78, + "end": 20.92, + "confidence": 0.388 + }, + { + "text": "les", + "start": 20.92, + "end": 20.96, + "confidence": 0.22 + }, + { + "text": "profites", + "start": 20.96, + "end": 21.36, + "confidence": 0.57 + }, + { + "text": "aussi", + "start": 21.36, + "end": 21.72, + "confidence": 0.52 + }, + { + "text": "de", + "start": 21.72, + "end": 21.92, + "confidence": 0.492 + }, + { + "text": "20", + "start": 21.92, + "end": 22.14, + "confidence": 0.915 + }, + { + "text": "ans", + "start": 22.14, + "end": 22.32, + "confidence": 0.942 + }, + { + "text": "pendant", + "start": 22.32, + "end": 22.52, + "confidence": 0.916 + }, + { + "text": "l'été,", + "start": 22.52, + "end": 22.86, + "confidence": 0.48 + }, + { + "text": "les", + "start": 22.98, + "end": 23.1, + "confidence": 0.903 + }, + { + "text": "ordinateurs", + "start": 23.1, + "end": 23.58, + "confidence": 0.946 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 23.58, + "end": 28.07, + "text": " nous ont appris à piquer sur des icônes, sauf que, alors le smartphone ajoute le toucher,", + "tokens": [ + 51543, + 
4666, + 6592, + 724, + 5714, + 1531, + 280, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 11, + 601, + 2947, + 631, + 11, + 11246, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 51766 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.656, + "words": [ + { + "text": "nous", + "start": 23.58, + "end": 23.78, + "confidence": 0.767 + }, + { + "text": "ont", + "start": 23.78, + "end": 23.9, + "confidence": 0.98 + }, + { + "text": "appris", + "start": 23.9, + "end": 24.12, + "confidence": 0.952 + }, + { + "text": "à", + "start": 24.12, + "end": 24.26, + "confidence": 0.34 + }, + { + "text": "piquer", + "start": 24.26, + "end": 24.54, + "confidence": 0.449 + }, + { + "text": "sur", + "start": 24.54, + "end": 24.72, + "confidence": 0.816 + }, + { + "text": "des", + "start": 24.72, + "end": 24.9, + "confidence": 0.96 + }, + { + "text": "icônes,", + "start": 24.9, + "end": 25.56, + "confidence": 0.599 + }, + { + "text": "sauf", + "start": 25.64, + "end": 25.8, + "confidence": 0.522 + }, + { + "text": "que,", + "start": 25.8, + "end": 26.36, + "confidence": 0.915 + }, + { + "text": "alors", + "start": 26.36, + "end": 26.58, + "confidence": 0.396 + }, + { + "text": "le", + "start": 26.58, + "end": 26.72, + "confidence": 0.824 + }, + { + "text": "smartphone", + "start": 26.72, + "end": 27.0, + "confidence": 0.977 + }, + { + "text": "ajoute", + "start": 27.0, + "end": 27.5, + "confidence": 0.674 + }, + { + "text": "le", + "start": 27.5, + "end": 27.62, + "confidence": 0.552 + }, + { + "text": "toucher,", + "start": 27.62, + "end": 28.07, + "confidence": 0.631 + } + ] + }, + { + "id": 8, + "seek": 2804, + "start": 28.07, + "end": 30.6, + "text": " qui rend le contact plus direct, plus sensible.", + "tokens": [ + 50364, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13, + 50496 + ], + "temperature": 0.0, + "avg_logprob": 
-0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.742, + "words": [ + { + "text": "qui", + "start": 28.07, + "end": 28.26, + "confidence": 0.305 + }, + { + "text": "rend", + "start": 28.26, + "end": 28.5, + "confidence": 0.763 + }, + { + "text": "le", + "start": 28.5, + "end": 28.72, + "confidence": 0.988 + }, + { + "text": "contact", + "start": 28.72, + "end": 29.06, + "confidence": 0.817 + }, + { + "text": "plus", + "start": 29.06, + "end": 29.48, + "confidence": 0.84 + }, + { + "text": "direct,", + "start": 29.48, + "end": 30.02, + "confidence": 0.944 + }, + { + "text": "plus", + "start": 30.18, + "end": 30.24, + "confidence": 0.992 + }, + { + "text": "sensible.", + "start": 30.24, + "end": 30.6, + "confidence": 0.618 + } + ] + }, + { + "id": 9, + "seek": 2804, + "start": 31.1, + "end": 34.76, + "text": " Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté", + "tokens": [ + 50496, + 3790, + 9093, + 11, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193, + 476, + 18437, + 50698 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.777, + "words": [ + { + "text": "Et", + "start": 31.1, + "end": 31.24, + "confidence": 0.949 + }, + { + "text": "puis,", + "start": 31.24, + "end": 31.36, + "confidence": 0.721 + }, + { + "text": "évidemment,", + "start": 31.42, + "end": 31.62, + "confidence": 0.213 + }, + { + "text": "il", + "start": 31.7, + "end": 31.76, + "confidence": 0.959 + }, + { + "text": "faudrait", + "start": 31.76, + "end": 31.94, + "confidence": 0.994 + }, + { + "text": "parler", + "start": 31.94, + "end": 32.14, + "confidence": 0.847 + }, + { + "text": "aussi", + "start": 32.14, + "end": 32.36, + "confidence": 0.925 + }, + { + "text": "des", + "start": 32.36, + 
"end": 32.46, + "confidence": 0.921 + }, + { + "text": "applications", + "start": 32.46, + "end": 32.88, + "confidence": 0.857 + }, + { + "text": "qui", + "start": 32.88, + "end": 33.2, + "confidence": 0.663 + }, + { + "text": "permettent", + "start": 33.2, + "end": 33.8, + "confidence": 0.952 + }, + { + "text": "de", + "start": 33.8, + "end": 33.96, + "confidence": 0.951 + }, + { + "text": "contourner", + "start": 33.96, + "end": 34.4, + "confidence": 0.721 + }, + { + "text": "le", + "start": 34.4, + "end": 34.52, + "confidence": 0.654 + }, + { + "text": "côté", + "start": 34.52, + "end": 34.76, + "confidence": 0.641 + } + ] + }, + { + "id": 10, + "seek": 2804, + "start": 34.8, + "end": 37.86, + "text": " tout flu de la navigation web pour aller directement en but.", + "tokens": [ + 50698, + 3486, + 5029, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 465, + 457, + 13, + 50860 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.735, + "words": [ + { + "text": "tout", + "start": 34.8, + "end": 35.04, + "confidence": 0.945 + }, + { + "text": "flu", + "start": 35.04, + "end": 35.32, + "confidence": 0.484 + }, + { + "text": "de", + "start": 35.32, + "end": 35.64, + "confidence": 0.35 + }, + { + "text": "la", + "start": 35.64, + "end": 35.78, + "confidence": 0.921 + }, + { + "text": "navigation", + "start": 35.78, + "end": 36.24, + "confidence": 0.903 + }, + { + "text": "web", + "start": 36.24, + "end": 36.64, + "confidence": 0.913 + }, + { + "text": "pour", + "start": 36.64, + "end": 36.84, + "confidence": 0.57 + }, + { + "text": "aller", + "start": 36.84, + "end": 37.06, + "confidence": 0.991 + }, + { + "text": "directement", + "start": 37.06, + "end": 37.48, + "confidence": 0.981 + }, + { + "text": "en", + "start": 37.48, + "end": 37.7, + "confidence": 0.654 + }, + { + "text": "but.", + "start": 37.7, + "end": 37.86, + "confidence": 0.768 + } 
+ ] + }, + { + "id": 11, + "seek": 2804, + "start": 38.78, + "end": 43.12, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas,", + "tokens": [ + 50860, + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 5550, + 14964, + 11, + 465, + 38268, + 11, + 51121 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.737, + "words": [ + { + "text": "Bref,", + "start": 38.78, + "end": 38.8, + "confidence": 0.972 + }, + { + "text": "tout", + "start": 38.84, + "end": 39.04, + "confidence": 0.817 + }, + { + "text": "ça,", + "start": 39.04, + "end": 39.46, + "confidence": 0.984 + }, + { + "text": "ce", + "start": 39.54, + "end": 39.76, + "confidence": 0.905 + }, + { + "text": "sont", + "start": 39.76, + "end": 39.96, + "confidence": 0.98 + }, + { + "text": "les", + "start": 39.96, + "end": 40.1, + "confidence": 0.982 + }, + { + "text": "conditions", + "start": 40.1, + "end": 40.64, + "confidence": 0.956 + }, + { + "text": "qui", + "start": 40.64, + "end": 40.96, + "confidence": 0.995 + }, + { + "text": "permettent", + "start": 40.96, + "end": 41.58, + "confidence": 0.994 + }, + { + "text": "de", + "start": 41.58, + "end": 41.64, + "confidence": 0.993 + }, + { + "text": "créer", + "start": 41.64, + "end": 42.08, + "confidence": 0.91 + }, + { + "text": "cette", + "start": 42.08, + "end": 42.34, + "confidence": 0.473 + }, + { + "text": "objet,", + "start": 42.34, + "end": 42.64, + "confidence": 0.235 + }, + { + "text": "en", + "start": 42.7, + "end": 42.84, + "confidence": 0.221 + }, + { + "text": "Nicolas,", + "start": 42.84, + "end": 43.12, + "confidence": 0.537 + } + ] + }, + { + "id": 12, + "seek": 2804, + "start": 43.12, + "end": 46.58, + "text": " dit qu'il est très symbolablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 51121, + 6176, + 421, + 6, 
+ 388, + 871, + 5732, + 5986, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13, + 51290 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.717, + "words": [ + { + "text": "dit", + "start": 43.12, + "end": 43.56, + "confidence": 0.696 + }, + { + "text": "qu'il", + "start": 43.56, + "end": 43.76, + "confidence": 0.958 + }, + { + "text": "est", + "start": 43.76, + "end": 43.9, + "confidence": 0.849 + }, + { + "text": "très", + "start": 43.9, + "end": 44.08, + "confidence": 0.443 + }, + { + "text": "symbolablement", + "start": 44.08, + "end": 44.86, + "confidence": 0.321 + }, + { + "text": "inédit", + "start": 44.86, + "end": 45.54, + "confidence": 0.655 + }, + { + "text": "dans", + "start": 45.54, + "end": 45.74, + "confidence": 0.817 + }, + { + "text": "l'histoire", + "start": 45.74, + "end": 46.02, + "confidence": 0.824 + }, + { + "text": "de", + "start": 46.02, + "end": 46.14, + "confidence": 0.983 + }, + { + "text": "l'humanité.", + "start": 46.14, + "end": 46.58, + "confidence": 0.99 + } + ] + }, + { + "id": 13, + "seek": 2804, + "start": 47.06, + "end": 48.76, + "text": " Mais ça s'assoulait d'une autre interrogation.", + "tokens": [ + 51290, + 6313, + 2788, + 262, + 6, + 640, + 263, + 35235, + 274, + 6, + 2613, + 15081, + 24871, + 399, + 13, + 51402 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.717, + "words": [ + { + "text": "Mais", + "start": 47.06, + "end": 47.24, + "confidence": 0.928 + }, + { + "text": "ça", + "start": 47.24, + "end": 47.48, + "confidence": 0.75 + }, + { + "text": "s'assoulait", + "start": 47.48, + "end": 47.84, + "confidence": 0.616 + }, + { + "text": "d'une", + "start": 47.84, + "end": 48.08, + "confidence": 0.674 + }, + { + "text": "autre", + 
"start": 48.08, + "end": 48.18, + "confidence": 0.964 + }, + { + "text": "interrogation.", + "start": 48.18, + "end": 48.76, + "confidence": 0.855 + } + ] + }, + { + "id": 14, + "seek": 2804, + "start": 49.42, + "end": 54.93, + "text": " Est-ce que le fait que cette objet soit inédit un d'huits que notre rapport a lui est aussi un rapport", + "tokens": [ + 51402, + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 5550, + 14964, + 12703, + 294, + 7811, + 270, + 517, + 274, + 6, + 12086, + 1208, + 631, + 10349, + 18018, + 257, + 8783, + 871, + 6212, + 517, + 18018, + 51710 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.704, + "words": [ + { + "text": "Est-ce", + "start": 49.42, + "end": 49.7, + "confidence": 0.919 + }, + { + "text": "que", + "start": 49.7, + "end": 49.74, + "confidence": 0.99 + }, + { + "text": "le", + "start": 49.74, + "end": 49.82, + "confidence": 0.871 + }, + { + "text": "fait", + "start": 49.82, + "end": 50.02, + "confidence": 0.945 + }, + { + "text": "que", + "start": 50.02, + "end": 50.16, + "confidence": 0.923 + }, + { + "text": "cette", + "start": 50.16, + "end": 50.3, + "confidence": 0.943 + }, + { + "text": "objet", + "start": 50.3, + "end": 50.64, + "confidence": 0.963 + }, + { + "text": "soit", + "start": 50.64, + "end": 51.1, + "confidence": 0.99 + }, + { + "text": "inédit", + "start": 51.1, + "end": 51.82, + "confidence": 0.928 + }, + { + "text": "un", + "start": 51.82, + "end": 52.08, + "confidence": 0.511 + }, + { + "text": "d'huits", + "start": 52.08, + "end": 52.34, + "confidence": 0.246 + }, + { + "text": "que", + "start": 52.34, + "end": 52.44, + "confidence": 0.974 + }, + { + "text": "notre", + "start": 52.44, + "end": 52.66, + "confidence": 0.992 + }, + { + "text": "rapport", + "start": 52.66, + "end": 53.24, + "confidence": 0.779 + }, + { + "text": "a", + "start": 53.24, + "end": 53.5, + "confidence": 0.57 + 
}, + { + "text": "lui", + "start": 53.5, + "end": 53.7, + "confidence": 0.701 + }, + { + "text": "est", + "start": 53.7, + "end": 54.04, + "confidence": 0.879 + }, + { + "text": "aussi", + "start": 54.04, + "end": 54.52, + "confidence": 0.815 + }, + { + "text": "un", + "start": 54.52, + "end": 54.7, + "confidence": 0.48 + }, + { + "text": "rapport", + "start": 54.7, + "end": 54.93, + "confidence": 0.952 + } + ] + }, + { + "id": 15, + "seek": 2804, + "start": 54.93, + "end": 55.88, + "text": " inédit ?", + "tokens": [ + 51710, + 294, + 7811, + 270, + 2506, + 51760 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.86, + "words": [ + { + "text": "inédit ?", + "start": 54.93, + "end": 55.88, + "confidence": 0.86 + } + ] + }, + { + "id": 16, + "seek": 5596, + "start": 55.96, + "end": 59.36, + "text": " Est-ce que le rapport qu'on a au sein de foi n'est comparable à celui qu'on entretenait", + "tokens": [ + 50364, + 4410, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 6195, + 368, + 6901, + 297, + 6, + 377, + 25323, + 1531, + 22829, + 421, + 6, + 266, + 3962, + 1147, + 1001, + 50530 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.62, + "words": [ + { + "text": "Est-ce", + "start": 55.96, + "end": 56.38, + "confidence": 0.553 + }, + { + "text": "que", + "start": 56.38, + "end": 56.44, + "confidence": 0.892 + }, + { + "text": "le", + "start": 56.44, + "end": 56.58, + "confidence": 0.982 + }, + { + "text": "rapport", + "start": 56.58, + "end": 56.9, + "confidence": 0.999 + }, + { + "text": "qu'on", + "start": 56.9, + "end": 57.14, + "confidence": 0.902 + }, + { + "text": "a", + "start": 57.14, + "end": 57.2, + "confidence": 0.959 + }, + { + "text": "au", + "start": 57.2, + "end": 57.28, + "confidence": 0.273 + }, + { 
+ "text": "sein", + "start": 57.28, + "end": 57.42, + "confidence": 0.17 + }, + { + "text": "de", + "start": 57.42, + "end": 57.56, + "confidence": 0.229 + }, + { + "text": "foi", + "start": 57.56, + "end": 57.58, + "confidence": 0.121 + }, + { + "text": "n'est", + "start": 57.58, + "end": 57.78, + "confidence": 0.79 + }, + { + "text": "comparable", + "start": 57.78, + "end": 58.28, + "confidence": 0.547 + }, + { + "text": "à", + "start": 58.28, + "end": 58.48, + "confidence": 0.934 + }, + { + "text": "celui", + "start": 58.48, + "end": 58.7, + "confidence": 0.851 + }, + { + "text": "qu'on", + "start": 58.7, + "end": 58.94, + "confidence": 0.926 + }, + { + "text": "entretenait", + "start": 58.94, + "end": 59.36, + "confidence": 0.56 + } + ] + }, + { + "id": 17, + "seek": 5596, + "start": 59.36, + "end": 63.14, + "text": " à d'autres objectes techniques comme la voiture ou le téléphone ?", + "tokens": [ + 50530, + 1531, + 274, + 6, + 16752, + 2657, + 279, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.756, + "words": [ + { + "text": "à", + "start": 59.36, + "end": 59.44, + "confidence": 0.951 + }, + { + "text": "d'autres", + "start": 59.44, + "end": 59.68, + "confidence": 0.857 + }, + { + "text": "objectes", + "start": 59.68, + "end": 60.02, + "confidence": 0.507 + }, + { + "text": "techniques", + "start": 60.02, + "end": 60.44, + "confidence": 0.462 + }, + { + "text": "comme", + "start": 60.44, + "end": 61.04, + "confidence": 0.639 + }, + { + "text": "la", + "start": 61.04, + "end": 61.52, + "confidence": 0.905 + }, + { + "text": "voiture", + "start": 61.52, + "end": 61.86, + "confidence": 0.946 + }, + { + "text": "ou", + "start": 61.86, + "end": 62.46, + "confidence": 0.755 + }, + { + "text": "le", + "start": 62.46, + "end": 62.68, + "confidence": 0.913 + }, + { + "text": 
"téléphone ?", + "start": 62.68, + "end": 63.14, + "confidence": 0.983 + } + ] + }, + { + "id": 18, + "seek": 5596, + "start": 65.4, + "end": 66.16, + "text": " Il n'y a pas d'équivalent.", + "tokens": [ + 50714, + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 13, + 50872 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.881, + "words": [ + { + "text": "Il", + "start": 65.4, + "end": 65.5, + "confidence": 0.901 + }, + { + "text": "n'y", + "start": 65.5, + "end": 65.54, + "confidence": 0.86 + }, + { + "text": "a", + "start": 65.54, + "end": 65.56, + "confidence": 0.962 + }, + { + "text": "pas", + "start": 65.56, + "end": 65.68, + "confidence": 0.998 + }, + { + "text": "d'équivalent.", + "start": 65.68, + "end": 66.16, + "confidence": 0.852 + } + ] + }, + { + "id": 19, + "seek": 5596, + "start": 66.16, + "end": 69.92, + "text": " On s'est espèrent de nous voter dans la relation à l'objet.", + "tokens": [ + 50872, + 1282, + 262, + 6, + 377, + 7089, + 1462, + 1753, + 368, + 4666, + 21722, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 13, + 51058 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.501, + "words": [ + { + "text": "On", + "start": 66.16, + "end": 67.08, + "confidence": 0.302 + }, + { + "text": "s'est", + "start": 67.08, + "end": 67.3, + "confidence": 0.563 + }, + { + "text": "espèrent", + "start": 67.3, + "end": 67.62, + "confidence": 0.134 + }, + { + "text": "de", + "start": 67.62, + "end": 67.66, + "confidence": 0.99 + }, + { + "text": "nous", + "start": 67.66, + "end": 67.84, + "confidence": 0.763 + }, + { + "text": "voter", + "start": 67.84, + "end": 68.36, + "confidence": 0.181 + }, + { + "text": "dans", + "start": 68.36, + "end": 68.86, + "confidence": 0.82 + }, + { + "text": 
"la", + "start": 68.86, + "end": 68.96, + "confidence": 0.617 + }, + { + "text": "relation", + "start": 68.96, + "end": 69.24, + "confidence": 0.949 + }, + { + "text": "à", + "start": 69.24, + "end": 69.42, + "confidence": 0.75 + }, + { + "text": "l'objet.", + "start": 69.42, + "end": 69.92, + "confidence": 0.887 + } + ] + }, + { + "id": 20, + "seek": 5596, + "start": 70.2, + "end": 71.22, + "text": " C'est facilement éterricion.", + "tokens": [ + 51058, + 383, + 6, + 377, + 23670, + 518, + 1136, + 391, + 1341, + 313, + 13, + 51122 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.441, + "words": [ + { + "text": "C'est", + "start": 70.2, + "end": 70.34, + "confidence": 0.895 + }, + { + "text": "facilement", + "start": 70.34, + "end": 70.7, + "confidence": 0.562 + }, + { + "text": "éterricion.", + "start": 70.7, + "end": 71.22, + "confidence": 0.23 + } + ] + }, + { + "id": 21, + "seek": 5596, + "start": 71.64, + "end": 76.97, + "text": " Parce que la passion de l'utilisateur et ses affices a dépendance, cette objet d'un lieu", + "tokens": [ + 51122, + 20429, + 631, + 635, + 5418, + 368, + 287, + 6, + 20835, + 271, + 15540, + 1030, + 5385, + 2096, + 1473, + 257, + 45768, + 719, + 11, + 5550, + 14964, + 274, + 6, + 409, + 26036, + 51416 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.457, + "words": [ + { + "text": "Parce", + "start": 71.64, + "end": 71.94, + "confidence": 0.679 + }, + { + "text": "que", + "start": 71.94, + "end": 72.32, + "confidence": 0.566 + }, + { + "text": "la", + "start": 72.32, + "end": 72.56, + "confidence": 0.336 + }, + { + "text": "passion", + "start": 72.56, + "end": 72.9, + "confidence": 0.267 + }, + { + "text": "de", + "start": 72.9, + "end": 73.24, + "confidence": 0.365 + }, + { + "text": "l'utilisateur", 
+ "start": 73.24, + "end": 74.82, + "confidence": 0.499 + }, + { + "text": "et", + "start": 74.82, + "end": 74.92, + "confidence": 0.45 + }, + { + "text": "ses", + "start": 74.92, + "end": 75.04, + "confidence": 0.095 + }, + { + "text": "affices", + "start": 75.04, + "end": 75.24, + "confidence": 0.303 + }, + { + "text": "a", + "start": 75.24, + "end": 75.38, + "confidence": 0.59 + }, + { + "text": "dépendance,", + "start": 75.38, + "end": 76.06, + "confidence": 0.559 + }, + { + "text": "cette", + "start": 76.32, + "end": 76.34, + "confidence": 0.401 + }, + { + "text": "objet", + "start": 76.34, + "end": 76.54, + "confidence": 0.924 + }, + { + "text": "d'un", + "start": 76.54, + "end": 76.92, + "confidence": 0.783 + }, + { + "text": "lieu", + "start": 76.92, + "end": 76.97, + "confidence": 0.307 + } + ] + }, + { + "id": 22, + "seek": 5596, + "start": 76.97, + "end": 82.15, + "text": " en fait, une espèce de relation de médiation avec le monde qui rendent encore avec", + "tokens": [ + 51416, + 465, + 3887, + 11, + 2251, + 7089, + 30236, + 368, + 9721, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 317, + 10122, + 4163, + 51671 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.746, + "words": [ + { + "text": "en", + "start": 76.97, + "end": 77.2, + "confidence": 0.767 + }, + { + "text": "fait,", + "start": 77.2, + "end": 77.32, + "confidence": 0.944 + }, + { + "text": "une", + "start": 77.46, + "end": 77.48, + "confidence": 0.696 + }, + { + "text": "espèce", + "start": 77.48, + "end": 77.9, + "confidence": 0.97 + }, + { + "text": "de", + "start": 77.9, + "end": 78.08, + "confidence": 0.994 + }, + { + "text": "relation", + "start": 78.08, + "end": 78.5, + "confidence": 0.826 + }, + { + "text": "de", + "start": 78.5, + "end": 78.94, + "confidence": 0.72 + }, + { + "text": "médiation", + "start": 78.94, + "end": 79.5, + "confidence": 
0.881 + }, + { + "text": "avec", + "start": 79.5, + "end": 79.74, + "confidence": 0.968 + }, + { + "text": "le", + "start": 79.74, + "end": 79.94, + "confidence": 0.986 + }, + { + "text": "monde", + "start": 79.94, + "end": 80.44, + "confidence": 0.906 + }, + { + "text": "qui", + "start": 80.44, + "end": 81.14, + "confidence": 0.825 + }, + { + "text": "rendent", + "start": 81.14, + "end": 81.8, + "confidence": 0.584 + }, + { + "text": "encore", + "start": 81.8, + "end": 81.98, + "confidence": 0.198 + }, + { + "text": "avec", + "start": 81.98, + "end": 82.15, + "confidence": 0.486 + } + ] + }, + { + "id": 23, + "seek": 8210, + "start": 82.15, + "end": 83.44, + "text": " la maille de celles formes de rogeur.", + "tokens": [ + 50364, + 635, + 463, + 3409, + 368, + 2815, + 279, + 1254, + 279, + 368, + 744, + 432, + 374, + 13, + 50440 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.465, + "words": [ + { + "text": "la", + "start": 82.15, + "end": 82.22, + "confidence": 0.648 + }, + { + "text": "maille", + "start": 82.22, + "end": 82.4, + "confidence": 0.136 + }, + { + "text": "de", + "start": 82.4, + "end": 82.48, + "confidence": 0.585 + }, + { + "text": "celles", + "start": 82.48, + "end": 82.74, + "confidence": 0.561 + }, + { + "text": "formes", + "start": 82.74, + "end": 82.96, + "confidence": 0.78 + }, + { + "text": "de", + "start": 82.96, + "end": 83.0, + "confidence": 0.936 + }, + { + "text": "rogeur.", + "start": 83.0, + "end": 83.44, + "confidence": 0.433 + } + ] + }, + { + "id": 24, + "seek": 8210, + "start": 83.98, + "end": 87.86, + "text": " Donc, à objets inédits, rapport inédits.", + "tokens": [ + 50440, + 7477, + 11, + 1531, + 1111, + 25349, + 294, + 7811, + 1208, + 11, + 18018, + 294, + 7811, + 1208, + 13, + 50640 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + 
"no_speech_prob": 0.2066797912120819, + "confidence": 0.745, + "words": [ + { + "text": "Donc,", + "start": 83.98, + "end": 84.46, + "confidence": 0.833 + }, + { + "text": "à", + "start": 84.56, + "end": 84.96, + "confidence": 0.696 + }, + { + "text": "objets", + "start": 84.96, + "end": 85.44, + "confidence": 0.526 + }, + { + "text": "inédits,", + "start": 85.44, + "end": 86.24, + "confidence": 0.701 + }, + { + "text": "rapport", + "start": 86.32, + "end": 86.92, + "confidence": 0.944 + }, + { + "text": "inédits.", + "start": 86.92, + "end": 87.86, + "confidence": 0.908 + } + ] + }, + { + "id": 25, + "seek": 8210, + "start": 88.1, + "end": 94.2, + "text": " Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépendance", + "tokens": [ + 50640, + 3790, + 11, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 46750, + 38268, + 11, + 431, + 4212, + 1032, + 578, + 4198, + 50027, + 971, + 517, + 41953, + 933, + 368, + 45768, + 719, + 50972 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.669, + "words": [ + { + "text": "Et,", + "start": 88.1, + "end": 88.3, + "confidence": 0.865 + }, + { + "text": "ce", + "start": 88.58, + "end": 88.84, + "confidence": 0.277 + }, + { + "text": "rapport,", + "start": 88.84, + "end": 89.28, + "confidence": 0.998 + }, + { + "text": "si", + "start": 89.38, + "end": 89.56, + "confidence": 0.933 + }, + { + "text": "j'en", + "start": 89.56, + "end": 89.74, + "confidence": 0.78 + }, + { + "text": "prends", + "start": 89.74, + "end": 89.92, + "confidence": 0.307 + }, + { + "text": "Nicolas,", + "start": 89.92, + "end": 90.22, + "confidence": 0.65 + }, + { + "text": "frère", + "start": 90.78, + "end": 91.1, + "confidence": 0.431 + }, + { + "text": "caractérisée", + "start": 91.1, + "end": 91.8, + "confidence": 0.595 + }, + { + "text": "par", + "start": 91.8, + "end": 92.14, + "confidence": 0.907 + }, + { 
+ "text": "un", + "start": 92.14, + "end": 92.34, + "confidence": 0.989 + }, + { + "text": "mélange", + "start": 92.34, + "end": 92.98, + "confidence": 0.92 + }, + { + "text": "de", + "start": 92.98, + "end": 93.24, + "confidence": 0.842 + }, + { + "text": "dépendance", + "start": 93.24, + "end": 94.2, + "confidence": 0.675 + } + ] + }, + { + "id": 26, + "seek": 8210, + "start": 94.36, + "end": 95.08, + "text": " et de rogeur.", + "tokens": [ + 50972, + 1030, + 368, + 744, + 432, + 374, + 13, + 51022 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.851, + "words": [ + { + "text": "et", + "start": 94.36, + "end": 94.52, + "confidence": 0.97 + }, + { + "text": "de", + "start": 94.52, + "end": 94.64, + "confidence": 0.996 + }, + { + "text": "rogeur.", + "start": 94.64, + "end": 95.08, + "confidence": 0.773 + } + ] + }, + { + "id": 27, + "seek": 8210, + "start": 96.3, + "end": 100.48, + "text": " Bon, en vrai, il faudrait remonter très, très filmant tout l'histoire des objectes", + "tokens": [ + 51022, + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 11, + 5732, + 2007, + 394, + 3486, + 287, + 6, + 29093, + 730, + 2657, + 279, + 51286 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.752, + "words": [ + { + "text": "Bon,", + "start": 96.3, + "end": 96.32, + "confidence": 0.6 + }, + { + "text": "en", + "start": 96.36, + "end": 96.58, + "confidence": 0.918 + }, + { + "text": "vrai,", + "start": 96.58, + "end": 96.92, + "confidence": 0.992 + }, + { + "text": "il", + "start": 97.14, + "end": 97.18, + "confidence": 0.987 + }, + { + "text": "faudrait", + "start": 97.18, + "end": 97.56, + "confidence": 0.933 + }, + { + "text": "remonter", + "start": 97.56, + "end": 98.08, + "confidence": 0.61 + }, + { + 
"text": "très,", + "start": 98.08, + "end": 98.56, + "confidence": 0.975 + }, + { + "text": "très", + "start": 98.56, + "end": 98.86, + "confidence": 0.986 + }, + { + "text": "filmant", + "start": 98.86, + "end": 99.42, + "confidence": 0.409 + }, + { + "text": "tout", + "start": 99.42, + "end": 99.68, + "confidence": 0.348 + }, + { + "text": "l'histoire", + "start": 99.68, + "end": 100.08, + "confidence": 0.876 + }, + { + "text": "des", + "start": 100.08, + "end": 100.22, + "confidence": 0.957 + }, + { + "text": "objectes", + "start": 100.22, + "end": 100.48, + "confidence": 0.842 + } + ] + }, + { + "id": 28, + "seek": 8210, + "start": 100.48, + "end": 105.24, + "text": " techniques et de leur infertion dans nos vieux pour déterminer si ce rapport est totalement", + "tokens": [ + 51286, + 7512, + 1030, + 368, + 9580, + 1536, + 911, + 313, + 2680, + 3269, + 4941, + 2449, + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203, + 51530 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.614, + "words": [ + { + "text": "techniques", + "start": 100.48, + "end": 101.0, + "confidence": 0.952 + }, + { + "text": "et", + "start": 101.0, + "end": 101.58, + "confidence": 0.943 + }, + { + "text": "de", + "start": 101.58, + "end": 101.72, + "confidence": 0.975 + }, + { + "text": "leur", + "start": 101.72, + "end": 101.8, + "confidence": 0.803 + }, + { + "text": "infertion", + "start": 101.8, + "end": 102.34, + "confidence": 0.382 + }, + { + "text": "dans", + "start": 102.34, + "end": 102.5, + "confidence": 0.297 + }, + { + "text": "nos", + "start": 102.5, + "end": 102.68, + "confidence": 0.419 + }, + { + "text": "vieux", + "start": 102.68, + "end": 103.08, + "confidence": 0.386 + }, + { + "text": "pour", + "start": 103.08, + "end": 103.1, + "confidence": 0.281 + }, + { + "text": "déterminer", + "start": 103.1, + "end": 103.64, + "confidence": 0.976 
+ }, + { + "text": "si", + "start": 103.64, + "end": 103.8, + "confidence": 0.367 + }, + { + "text": "ce", + "start": 103.8, + "end": 103.92, + "confidence": 0.983 + }, + { + "text": "rapport", + "start": 103.92, + "end": 104.22, + "confidence": 0.998 + }, + { + "text": "est", + "start": 104.22, + "end": 104.88, + "confidence": 0.942 + }, + { + "text": "totalement", + "start": 104.88, + "end": 105.24, + "confidence": 0.907 + } + ] + }, + { + "id": 29, + "seek": 8210, + "start": 105.24, + "end": 106.1, + "text": " inédit.", + "tokens": [ + 51530, + 294, + 7811, + 270, + 13, + 51580 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.939, + "words": [ + { + "text": "inédit.", + "start": 105.24, + "end": 106.1, + "confidence": 0.939 + } + ] + }, + { + "id": 30, + "seek": 8210, + "start": 106.16, + "end": 109.44, + "text": " Mais j'ai l'impression comme ça que Nicolas se trompe pas vraiment.", + "tokens": [ + 51580, + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13, + 51738 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.811, + "words": [ + { + "text": "Mais", + "start": 106.16, + "end": 106.5, + "confidence": 0.721 + }, + { + "text": "j'ai", + "start": 106.5, + "end": 106.92, + "confidence": 0.91 + }, + { + "text": "l'impression", + "start": 106.92, + "end": 107.34, + "confidence": 0.956 + }, + { + "text": "comme", + "start": 107.34, + "end": 107.58, + "confidence": 0.7 + }, + { + "text": "ça", + "start": 107.58, + "end": 107.74, + "confidence": 0.953 + }, + { + "text": "que", + "start": 107.74, + "end": 108.06, + "confidence": 0.941 + }, + { + "text": "Nicolas", + "start": 108.06, + "end": 108.46, + "confidence": 0.994 + }, + { + "text": "se", + "start": 
108.46, + "end": 108.68, + "confidence": 0.716 + }, + { + "text": "trompe", + "start": 108.68, + "end": 109.02, + "confidence": 0.54 + }, + { + "text": "pas", + "start": 109.02, + "end": 109.16, + "confidence": 0.886 + }, + { + "text": "vraiment.", + "start": 109.16, + "end": 109.44, + "confidence": 0.963 + } + ] + }, + { + "id": 31, + "seek": 8210, + "start": 109.92, + "end": 110.86, + "text": " Pour autant, je sache.", + "tokens": [ + 51738, + 8732, + 34081, + 11, + 1506, + 262, + 6000, + 13, + 51808 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.6, + "words": [ + { + "text": "Pour", + "start": 109.92, + "end": 110.1, + "confidence": 0.49 + }, + { + "text": "autant,", + "start": 110.1, + "end": 110.28, + "confidence": 0.75 + }, + { + "text": "je", + "start": 110.42, + "end": 110.48, + "confidence": 0.931 + }, + { + "text": "sache.", + "start": 110.48, + "end": 110.86, + "confidence": 0.477 + } + ] + }, + { + "id": 32, + "seek": 11098, + "start": 111.04, + "end": 115.0, + "text": " Il y a eu plein de discussions autour de la voiture ou même du téléphone.", + "tokens": [ + 50364, + 4416, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698, + 1581, + 47159, + 13, + 50568 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.821, + "words": [ + { + "text": "Il", + "start": 111.04, + "end": 111.2, + "confidence": 0.905 + }, + { + "text": "y", + "start": 111.2, + "end": 111.3, + "confidence": 0.934 + }, + { + "text": "a", + "start": 111.3, + "end": 111.56, + "confidence": 0.893 + }, + { + "text": "eu", + "start": 111.56, + "end": 111.6, + "confidence": 0.839 + }, + { + "text": "plein", + "start": 111.6, + "end": 111.88, + "confidence": 0.776 + }, + { + "text": "de", + "start": 111.88, + "end": 
112.12, + "confidence": 0.944 + }, + { + "text": "discussions", + "start": 112.12, + "end": 112.6, + "confidence": 0.681 + }, + { + "text": "autour", + "start": 112.6, + "end": 113.04, + "confidence": 0.978 + }, + { + "text": "de", + "start": 113.04, + "end": 113.48, + "confidence": 0.975 + }, + { + "text": "la", + "start": 113.48, + "end": 113.56, + "confidence": 0.966 + }, + { + "text": "voiture", + "start": 113.56, + "end": 113.88, + "confidence": 0.983 + }, + { + "text": "ou", + "start": 113.88, + "end": 114.14, + "confidence": 0.66 + }, + { + "text": "même", + "start": 114.14, + "end": 114.34, + "confidence": 0.99 + }, + { + "text": "du", + "start": 114.34, + "end": 114.64, + "confidence": 0.283 + }, + { + "text": "téléphone.", + "start": 114.64, + "end": 115.0, + "confidence": 0.986 + } + ] + }, + { + "id": 33, + "seek": 11098, + "start": 115.52, + "end": 119.51, + "text": " Mais, la dépense n'était pas du même mort, donc le rejet n'en plus n'était pas du même", + "tokens": [ + 50568, + 6313, + 11, + 635, + 27998, + 1288, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 6599, + 11, + 5926, + 476, + 319, + 7108, + 297, + 6, + 268, + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 50790 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.701, + "words": [ + { + "text": "Mais,", + "start": 115.52, + "end": 115.82, + "confidence": 0.983 + }, + { + "text": "la", + "start": 115.9, + "end": 116.0, + "confidence": 0.961 + }, + { + "text": "dépense", + "start": 116.0, + "end": 116.42, + "confidence": 0.616 + }, + { + "text": "n'était", + "start": 116.42, + "end": 116.82, + "confidence": 0.955 + }, + { + "text": "pas", + "start": 116.82, + "end": 117.04, + "confidence": 0.994 + }, + { + "text": "du", + "start": 117.04, + "end": 117.2, + "confidence": 0.958 + }, + { + "text": "même", + "start": 117.2, + "end": 117.38, + "confidence": 0.929 + }, + { + 
"text": "mort,", + "start": 117.38, + "end": 117.58, + "confidence": 0.686 + }, + { + "text": "donc", + "start": 117.7, + "end": 118.02, + "confidence": 0.932 + }, + { + "text": "le", + "start": 118.02, + "end": 118.34, + "confidence": 0.95 + }, + { + "text": "rejet", + "start": 118.34, + "end": 118.64, + "confidence": 0.57 + }, + { + "text": "n'en", + "start": 118.64, + "end": 118.82, + "confidence": 0.429 + }, + { + "text": "plus", + "start": 118.82, + "end": 118.96, + "confidence": 0.055 + }, + { + "text": "n'était", + "start": 118.96, + "end": 119.16, + "confidence": 0.973 + }, + { + "text": "pas", + "start": 119.16, + "end": 119.32, + "confidence": 0.993 + }, + { + "text": "du", + "start": 119.32, + "end": 119.42, + "confidence": 0.823 + }, + { + "text": "même", + "start": 119.42, + "end": 119.51, + "confidence": 0.79 + } + ] + }, + { + "id": 34, + "seek": 11098, + "start": 119.51, + "end": 119.72, + "text": " mort.", + "tokens": [ + 50790, + 6599, + 13, + 50840 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.639, + "words": [ + { + "text": "mort.", + "start": 119.51, + "end": 119.72, + "confidence": 0.639 + } + ] + }, + { + "id": 35, + "seek": 11098, + "start": 120.04, + "end": 121.24, + "text": " On peut adorer sa bagnure.", + "tokens": [ + 50840, + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 77, + 540, + 13, + 50890 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.615, + "words": [ + { + "text": "On", + "start": 120.04, + "end": 120.22, + "confidence": 0.981 + }, + { + "text": "peut", + "start": 120.22, + "end": 120.36, + "confidence": 0.988 + }, + { + "text": "adorer", + "start": 120.36, + "end": 120.7, + "confidence": 0.859 + }, + { + "text": "sa", + "start": 120.7, + "end": 120.88, + "confidence": 0.918 + }, + { + 
"text": "bagnure.", + "start": 120.88, + "end": 121.24, + "confidence": 0.314 + } + ] + }, + { + "id": 36, + "seek": 11098, + "start": 121.38, + "end": 123.06, + "text": " On a par besoin pour plein de choses.", + "tokens": [ + 50890, + 1282, + 257, + 971, + 19207, + 2016, + 21088, + 368, + 14488, + 13, + 50972 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.722, + "words": [ + { + "text": "On", + "start": 121.38, + "end": 121.56, + "confidence": 0.897 + }, + { + "text": "a", + "start": 121.56, + "end": 121.64, + "confidence": 0.656 + }, + { + "text": "par", + "start": 121.64, + "end": 121.8, + "confidence": 0.161 + }, + { + "text": "besoin", + "start": 121.8, + "end": 122.12, + "confidence": 0.947 + }, + { + "text": "pour", + "start": 122.12, + "end": 122.5, + "confidence": 0.976 + }, + { + "text": "plein", + "start": 122.5, + "end": 122.72, + "confidence": 0.857 + }, + { + "text": "de", + "start": 122.72, + "end": 122.8, + "confidence": 0.993 + }, + { + "text": "choses.", + "start": 122.8, + "end": 123.06, + "confidence": 0.989 + } + ] + }, + { + "id": 37, + "seek": 11098, + "start": 123.36, + "end": 126.46, + "text": " Et là, le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 50972, + 3790, + 3684, + 11, + 476, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13, + 51142 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.835, + "words": [ + { + "text": "Et", + "start": 123.36, + "end": 123.5, + "confidence": 0.606 + }, + { + "text": "là,", + "start": 123.5, + "end": 123.76, + "confidence": 0.498 + }, + { + "text": "le", + "start": 123.82, + "end": 124.06, + "confidence": 0.986 + }, + { + "text": "soir,", + "start": 124.06, + "end": 124.42, + "confidence": 0.971 + }, + { + 
"text": "quand", + "start": 124.84, + "end": 124.96, + "confidence": 0.787 + }, + { + "text": "on", + "start": 124.96, + "end": 125.06, + "confidence": 0.988 + }, + { + "text": "va", + "start": 125.06, + "end": 125.18, + "confidence": 0.966 + }, + { + "text": "se", + "start": 125.18, + "end": 125.26, + "confidence": 0.869 + }, + { + "text": "coucher,", + "start": 125.26, + "end": 125.6, + "confidence": 0.804 + }, + { + "text": "on", + "start": 125.82, + "end": 126.06, + "confidence": 0.98 + }, + { + "text": "la", + "start": 126.06, + "end": 126.2, + "confidence": 0.811 + }, + { + "text": "laisse.", + "start": 126.2, + "end": 126.46, + "confidence": 0.985 + } + ] + }, + { + "id": 38, + "seek": 11098, + "start": 127.06, + "end": 130.1, + "text": " On la pade en la main quand on est colis, qu'on n'a même pas au chiot.", + "tokens": [ + 51142, + 1282, + 635, + 280, + 762, + 465, + 635, + 2135, + 6932, + 322, + 871, + 1173, + 271, + 11, + 421, + 6, + 266, + 297, + 6, + 64, + 5698, + 1736, + 1609, + 417, + 6471, + 13, + 51334 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.542, + "words": [ + { + "text": "On", + "start": 127.06, + "end": 127.32, + "confidence": 0.605 + }, + { + "text": "la", + "start": 127.32, + "end": 127.5, + "confidence": 0.35 + }, + { + "text": "pade", + "start": 127.5, + "end": 127.72, + "confidence": 0.18 + }, + { + "text": "en", + "start": 127.72, + "end": 127.88, + "confidence": 0.775 + }, + { + "text": "la", + "start": 127.88, + "end": 128.04, + "confidence": 0.795 + }, + { + "text": "main", + "start": 128.04, + "end": 128.3, + "confidence": 0.971 + }, + { + "text": "quand", + "start": 128.3, + "end": 128.46, + "confidence": 0.483 + }, + { + "text": "on", + "start": 128.46, + "end": 128.62, + "confidence": 0.994 + }, + { + "text": "est", + "start": 128.62, + "end": 128.74, + "confidence": 0.714 + }, + { + "text": "colis,", + 
"start": 128.74, + "end": 129.12, + "confidence": 0.501 + }, + { + "text": "qu'on", + "start": 129.22, + "end": 129.32, + "confidence": 0.777 + }, + { + "text": "n'a", + "start": 129.32, + "end": 129.42, + "confidence": 0.439 + }, + { + "text": "même", + "start": 129.42, + "end": 129.56, + "confidence": 0.324 + }, + { + "text": "pas", + "start": 129.56, + "end": 129.74, + "confidence": 1.0 + }, + { + "text": "au", + "start": 129.74, + "end": 129.88, + "confidence": 0.64 + }, + { + "text": "chiot.", + "start": 129.88, + "end": 130.1, + "confidence": 0.514 + } + ] + }, + { + "id": 39, + "seek": 11098, + "start": 130.94, + "end": 135.32, + "text": " On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une heure", + "tokens": [ + 51334, + 1282, + 45913, + 7418, + 1136, + 936, + 15797, + 971, + 1872, + 275, + 423, + 1956, + 2678, + 84, + 494, + 1001, + 635, + 34207, + 368, + 47159, + 17338, + 2251, + 30027, + 51574 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.656, + "words": [ + { + "text": "On", + "start": 130.94, + "end": 131.04, + "confidence": 0.99 + }, + { + "text": "pouvait", + "start": 131.04, + "end": 131.28, + "confidence": 0.588 + }, + { + "text": "être", + "start": 131.28, + "end": 131.6, + "confidence": 0.446 + }, + { + "text": "émervé", + "start": 131.6, + "end": 132.24, + "confidence": 0.725 + }, + { + "text": "par", + "start": 132.24, + "end": 132.5, + "confidence": 0.848 + }, + { + "text": "son", + "start": 132.5, + "end": 132.7, + "confidence": 0.445 + }, + { + "text": "mome", + "start": 132.7, + "end": 133.08, + "confidence": 0.255 + }, + { + "text": "qui", + "start": 133.08, + "end": 133.3, + "confidence": 0.911 + }, + { + "text": "occupeait", + "start": 133.3, + "end": 133.74, + "confidence": 0.642 + }, + { + "text": "la", + "start": 133.74, + "end": 133.86, + "confidence": 0.808 + }, + { + "text": 
"ligne", + "start": 133.86, + "end": 134.02, + "confidence": 0.975 + }, + { + "text": "de", + "start": 134.02, + "end": 134.24, + "confidence": 0.928 + }, + { + "text": "téléphone", + "start": 134.24, + "end": 134.56, + "confidence": 0.978 + }, + { + "text": "pendant", + "start": 134.56, + "end": 134.92, + "confidence": 0.901 + }, + { + "text": "une", + "start": 134.92, + "end": 135.18, + "confidence": 0.811 + }, + { + "text": "heure", + "start": 135.18, + "end": 135.32, + "confidence": 0.477 + } + ] + }, + { + "id": 40, + "seek": 11098, + "start": 135.32, + "end": 137.04, + "text": " chaque soir pour discuter avec un copain.", + "tokens": [ + 51574, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.955, + "words": [ + { + "text": "chaque", + "start": 135.32, + "end": 135.6, + "confidence": 0.99 + }, + { + "text": "soir", + "start": 135.6, + "end": 135.8, + "confidence": 0.997 + }, + { + "text": "pour", + "start": 135.8, + "end": 136.0, + "confidence": 0.981 + }, + { + "text": "discuter", + "start": 136.0, + "end": 136.34, + "confidence": 0.882 + }, + { + "text": "avec", + "start": 136.34, + "end": 136.5, + "confidence": 0.993 + }, + { + "text": "un", + "start": 136.5, + "end": 136.62, + "confidence": 0.967 + }, + { + "text": "copain.", + "start": 136.62, + "end": 137.04, + "confidence": 0.953 + } + ] + }, + { + "id": 41, + "seek": 13698, + "start": 137.32, + "end": 141.84, + "text": " Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui.", + "tokens": [ + 50376, + 6313, + 2788, + 408, + 725, + 37227, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 5698, + 275, + 423, + 14023, + 6, + 10556, + 13, + 50606 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 
1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.735, + "words": [ + { + "text": "Mais", + "start": 137.32, + "end": 137.52, + "confidence": 0.984 + }, + { + "text": "ça", + "start": 137.52, + "end": 137.7, + "confidence": 0.877 + }, + { + "text": "ne", + "start": 137.7, + "end": 137.8, + "confidence": 0.672 + }, + { + "text": "ressemble", + "start": 137.8, + "end": 138.22, + "confidence": 0.731 + }, + { + "text": "pas", + "start": 138.22, + "end": 138.76, + "confidence": 0.526 + }, + { + "text": "à", + "start": 138.76, + "end": 138.94, + "confidence": 0.98 + }, + { + "text": "ce", + "start": 138.94, + "end": 139.08, + "confidence": 0.578 + }, + { + "text": "qu'on", + "start": 139.08, + "end": 139.22, + "confidence": 0.96 + }, + { + "text": "peut", + "start": 139.22, + "end": 139.38, + "confidence": 0.547 + }, + { + "text": "ressentir", + "start": 139.38, + "end": 140.06, + "confidence": 0.888 + }, + { + "text": "à", + "start": 140.06, + "end": 140.26, + "confidence": 0.437 + }, + { + "text": "voir", + "start": 140.26, + "end": 140.54, + "confidence": 0.952 + }, + { + "text": "même", + "start": 140.54, + "end": 140.96, + "confidence": 0.297 + }, + { + "text": "mome", + "start": 140.96, + "end": 141.22, + "confidence": 0.496 + }, + { + "text": "aujourd'hui.", + "start": 141.22, + "end": 141.84, + "confidence": 0.961 + } + ] + }, + { + "id": 42, + "seek": 13698, + "start": 141.96, + "end": 145.86, + "text": " Continuellement avec son smartphone dans la main, comme c'était une sorte de estimateur", + "tokens": [ + 50606, + 14674, + 31816, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 5173, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 8017, + 15540, + 50810 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.663, + "words": [ + { + "text": "Continuellement", + "start": 141.96, + "end": 142.84, + "confidence": 0.844 + 
}, + { + "text": "avec", + "start": 142.84, + "end": 143.24, + "confidence": 0.646 + }, + { + "text": "son", + "start": 143.24, + "end": 143.42, + "confidence": 0.864 + }, + { + "text": "smartphone", + "start": 143.42, + "end": 143.72, + "confidence": 0.447 + }, + { + "text": "dans", + "start": 143.72, + "end": 143.92, + "confidence": 0.587 + }, + { + "text": "la", + "start": 143.92, + "end": 144.0, + "confidence": 0.974 + }, + { + "text": "main,", + "start": 144.0, + "end": 144.3, + "confidence": 0.995 + }, + { + "text": "comme", + "start": 144.42, + "end": 144.56, + "confidence": 0.895 + }, + { + "text": "c'était", + "start": 144.56, + "end": 144.84, + "confidence": 0.596 + }, + { + "text": "une", + "start": 144.84, + "end": 144.96, + "confidence": 0.972 + }, + { + "text": "sorte", + "start": 144.96, + "end": 145.1, + "confidence": 0.658 + }, + { + "text": "de", + "start": 145.1, + "end": 145.4, + "confidence": 0.312 + }, + { + "text": "estimateur", + "start": 145.4, + "end": 145.86, + "confidence": 0.489 + } + ] + }, + { + "id": 43, + "seek": 13698, + "start": 145.96, + "end": 149.0, + "text": " extère de tomber de lâcher à l'éantrénée, ça m'a eu immédiate.", + "tokens": [ + 50810, + 1279, + 4212, + 368, + 2916, + 607, + 368, + 48835, + 6759, + 1531, + 287, + 6, + 526, + 394, + 81, + 3516, + 3856, + 11, + 2788, + 275, + 6, + 64, + 2228, + 3397, + 526, + 4504, + 473, + 13, + 50954 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.416, + "words": [ + { + "text": "extère", + "start": 145.96, + "end": 146.4, + "confidence": 0.371 + }, + { + "text": "de", + "start": 146.4, + "end": 146.54, + "confidence": 0.254 + }, + { + "text": "tomber", + "start": 146.54, + "end": 146.7, + "confidence": 0.102 + }, + { + "text": "de", + "start": 146.7, + "end": 146.9, + "confidence": 0.454 + }, + { + "text": "lâcher", + "start": 146.9, + "end": 147.34, + "confidence": 
0.75 + }, + { + "text": "à", + "start": 147.34, + "end": 147.46, + "confidence": 0.444 + }, + { + "text": "l'éantrénée,", + "start": 147.46, + "end": 147.9, + "confidence": 0.491 + }, + { + "text": "ça", + "start": 148.0, + "end": 148.02, + "confidence": 0.799 + }, + { + "text": "m'a", + "start": 148.02, + "end": 148.26, + "confidence": 0.531 + }, + { + "text": "eu", + "start": 148.26, + "end": 148.44, + "confidence": 0.136 + }, + { + "text": "immédiate.", + "start": 148.44, + "end": 149.0, + "confidence": 0.505 + } + ] + }, + { + "id": 44, + "seek": 13698, + "start": 149.08, + "end": 151.98, + "text": " Bon, je dis ça pour le mome, mais évidemment, va là, bon aussi.", + "tokens": [ + 50954, + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 423, + 11, + 2420, + 24724, + 11, + 2773, + 3684, + 11, + 4428, + 6212, + 13, + 51126 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.564, + "words": [ + { + "text": "Bon,", + "start": 149.08, + "end": 149.28, + "confidence": 0.375 + }, + { + "text": "je", + "start": 149.34, + "end": 149.4, + "confidence": 0.471 + }, + { + "text": "dis", + "start": 149.4, + "end": 149.46, + "confidence": 0.324 + }, + { + "text": "ça", + "start": 149.46, + "end": 149.64, + "confidence": 0.952 + }, + { + "text": "pour", + "start": 149.64, + "end": 149.8, + "confidence": 0.963 + }, + { + "text": "le", + "start": 149.8, + "end": 149.92, + "confidence": 0.992 + }, + { + "text": "mome,", + "start": 149.92, + "end": 150.12, + "confidence": 0.619 + }, + { + "text": "mais", + "start": 150.46, + "end": 150.52, + "confidence": 0.694 + }, + { + "text": "évidemment,", + "start": 150.52, + "end": 151.12, + "confidence": 0.776 + }, + { + "text": "va", + "start": 151.26, + "end": 151.36, + "confidence": 0.388 + }, + { + "text": "là,", + "start": 151.36, + "end": 151.46, + "confidence": 0.59 + }, + { + "text": "bon", + "start": 151.6, 
+ "end": 151.68, + "confidence": 0.825 + }, + { + "text": "aussi.", + "start": 151.68, + "end": 151.98, + "confidence": 0.162 + } + ] + }, + { + "id": 45, + "seek": 13698, + "start": 152.64, + "end": 154.64, + "text": " Donc, rapport immédiate d'accord.", + "tokens": [ + 51126, + 7477, + 11, + 18018, + 3397, + 526, + 4504, + 473, + 274, + 6, + 19947, + 13, + 51248 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.861, + "words": [ + { + "text": "Donc,", + "start": 152.64, + "end": 153.08, + "confidence": 0.982 + }, + { + "text": "rapport", + "start": 153.16, + "end": 153.58, + "confidence": 0.979 + }, + { + "text": "immédiate", + "start": 153.58, + "end": 154.28, + "confidence": 0.841 + }, + { + "text": "d'accord.", + "start": 154.28, + "end": 154.64, + "confidence": 0.816 + } + ] + }, + { + "id": 46, + "seek": 13698, + "start": 155.66, + "end": 158.36, + "text": " Mais pourquoi, à ton impression qu'on en sortira, j'amé?", + "tokens": [ + 51248, + 6313, + 19934, + 11, + 1531, + 2952, + 9995, + 421, + 6, + 266, + 465, + 26906, + 64, + 11, + 361, + 6, + 335, + 526, + 30, + 51440 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.709, + "words": [ + { + "text": "Mais", + "start": 155.66, + "end": 155.88, + "confidence": 0.984 + }, + { + "text": "pourquoi,", + "start": 155.88, + "end": 156.28, + "confidence": 0.897 + }, + { + "text": "à", + "start": 156.38, + "end": 156.58, + "confidence": 0.837 + }, + { + "text": "ton", + "start": 156.58, + "end": 156.7, + "confidence": 0.953 + }, + { + "text": "impression", + "start": 156.7, + "end": 157.06, + "confidence": 0.938 + }, + { + "text": "qu'on", + "start": 157.06, + "end": 157.28, + "confidence": 0.89 + }, + { + "text": "en", + "start": 157.28, + "end": 157.4, + "confidence": 0.801 + }, + { + 
"text": "sortira,", + "start": 157.4, + "end": 157.88, + "confidence": 0.576 + }, + { + "text": "j'amé?", + "start": 157.96, + "end": 158.36, + "confidence": 0.464 + } + ] + }, + { + "id": 47, + "seek": 13698, + "start": 159.16, + "end": 163.32, + "text": " Et puis, il faut en remettre la faute sur les gens qui ont créé cette critique merveilleux", + "tokens": [ + 51440, + 3790, + 9093, + 11, + 1930, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 5550, + 25673, + 3551, + 303, + 3409, + 2449, + 51678 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.714, + "words": [ + { + "text": "Et", + "start": 159.16, + "end": 159.32, + "confidence": 0.832 + }, + { + "text": "puis,", + "start": 159.32, + "end": 159.46, + "confidence": 0.494 + }, + { + "text": "il", + "start": 159.62, + "end": 159.64, + "confidence": 0.594 + }, + { + "text": "faut", + "start": 159.64, + "end": 159.66, + "confidence": 0.951 + }, + { + "text": "en", + "start": 159.66, + "end": 159.78, + "confidence": 0.937 + }, + { + "text": "remettre", + "start": 159.78, + "end": 160.14, + "confidence": 0.984 + }, + { + "text": "la", + "start": 160.14, + "end": 160.42, + "confidence": 0.602 + }, + { + "text": "faute", + "start": 160.42, + "end": 160.68, + "confidence": 0.59 + }, + { + "text": "sur", + "start": 160.68, + "end": 160.98, + "confidence": 0.966 + }, + { + "text": "les", + "start": 160.98, + "end": 161.24, + "confidence": 0.828 + }, + { + "text": "gens", + "start": 161.24, + "end": 161.46, + "confidence": 0.986 + }, + { + "text": "qui", + "start": 161.46, + "end": 161.6, + "confidence": 0.98 + }, + { + "text": "ont", + "start": 161.6, + "end": 161.68, + "confidence": 0.95 + }, + { + "text": "créé", + "start": 161.68, + "end": 162.3, + "confidence": 0.95 + }, + { + "text": "cette", + "start": 162.3, + "end": 162.48, + 
"confidence": 0.908 + }, + { + "text": "critique", + "start": 162.48, + "end": 162.72, + "confidence": 0.032 + }, + { + "text": "merveilleux", + "start": 162.72, + "end": 163.32, + "confidence": 0.839 + } + ] + }, + { + "id": 48, + "seek": 13698, + "start": 163.32, + "end": 165.34, + "text": " et diabolique et diabolique par que merveilleux.", + "tokens": [ + 51678, + 1030, + 1026, + 14923, + 1925, + 1030, + 1026, + 14923, + 1925, + 971, + 631, + 3551, + 303, + 3409, + 2449, + 13, + 51778 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.708, + "words": [ + { + "text": "et", + "start": 163.32, + "end": 163.44, + "confidence": 0.945 + }, + { + "text": "diabolique", + "start": 163.44, + "end": 163.86, + "confidence": 0.573 + }, + { + "text": "et", + "start": 163.86, + "end": 163.94, + "confidence": 0.238 + }, + { + "text": "diabolique", + "start": 163.94, + "end": 164.38, + "confidence": 0.892 + }, + { + "text": "par", + "start": 164.38, + "end": 164.62, + "confidence": 0.544 + }, + { + "text": "que", + "start": 164.62, + "end": 164.82, + "confidence": 0.529 + }, + { + "text": "merveilleux.", + "start": 164.82, + "end": 165.34, + "confidence": 0.981 + } + ] + }, + { + "id": 49, + "seek": 16526, + "start": 166.9, + "end": 168.8, + "text": " Les économistes parlent de dépendance du santé.", + "tokens": [ + 50410, + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 30068, + 13, + 50542 + ], + "temperature": 0.0, + "avg_logprob": -0.6644235849380493, + "compression_ratio": 1.4761904761904763, + "no_speech_prob": 0.1915542334318161, + "confidence": 0.765, + "words": [ + { + "text": "Les", + "start": 166.9, + "end": 167.06, + "confidence": 0.699 + }, + { + "text": "économistes", + "start": 167.06, + "end": 167.52, + "confidence": 0.917 + }, + { + "text": "parlent", + "start": 167.52, + "end": 167.78, + "confidence": 0.793 + }, + { + 
"text": "de", + "start": 167.78, + "end": 167.84, + "confidence": 0.813 + }, + { + "text": "dépendance", + "start": 167.84, + "end": 168.36, + "confidence": 0.698 + }, + { + "text": "du", + "start": 168.36, + "end": 168.5, + "confidence": 0.963 + }, + { + "text": "santé.", + "start": 168.5, + "end": 168.8, + "confidence": 0.489 + } + ] + }, + { + "id": 50, + "seek": 16526, + "start": 168.82, + "end": 173.42, + "text": " Ces vidéos, en fait, on est un santé qui a été étabis, un soit mon termine, en marchand dessus,", + "tokens": [ + 50542, + 28414, + 25417, + 11, + 465, + 3887, + 11, + 322, + 871, + 517, + 30068, + 1956, + 257, + 8862, + 4823, + 455, + 271, + 11, + 517, + 12703, + 1108, + 1433, + 533, + 11, + 465, + 8368, + 474, + 30677, + 11, + 50784 + ], + "temperature": 0.0, + "avg_logprob": -0.6644235849380493, + "compression_ratio": 1.4761904761904763, + "no_speech_prob": 0.1915542334318161, + "confidence": 0.474, + "words": [ + { + "text": "Ces", + "start": 168.82, + "end": 169.14, + "confidence": 0.443 + }, + { + "text": "vidéos,", + "start": 169.14, + "end": 169.4, + "confidence": 0.455 + }, + { + "text": "en", + "start": 169.44, + "end": 169.64, + "confidence": 0.744 + }, + { + "text": "fait,", + "start": 169.64, + "end": 169.66, + "confidence": 0.976 + }, + { + "text": "on", + "start": 169.72, + "end": 169.74, + "confidence": 0.303 + }, + { + "text": "est", + "start": 169.74, + "end": 169.9, + "confidence": 0.814 + }, + { + "text": "un", + "start": 169.9, + "end": 170.48, + "confidence": 0.367 + }, + { + "text": "santé", + "start": 170.48, + "end": 170.8, + "confidence": 0.951 + }, + { + "text": "qui", + "start": 170.8, + "end": 170.92, + "confidence": 0.835 + }, + { + "text": "a", + "start": 170.92, + "end": 171.02, + "confidence": 0.819 + }, + { + "text": "été", + "start": 171.02, + "end": 171.12, + "confidence": 0.994 + }, + { + "text": "étabis,", + "start": 171.12, + "end": 171.5, + "confidence": 0.343 + }, + { + "text": "un", + "start": 171.76, + 
"end": 171.9, + "confidence": 0.236 + }, + { + "text": "soit", + "start": 171.9, + "end": 172.16, + "confidence": 0.31 + }, + { + "text": "mon", + "start": 172.16, + "end": 172.36, + "confidence": 0.205 + }, + { + "text": "termine,", + "start": 172.36, + "end": 172.72, + "confidence": 0.4 + }, + { + "text": "en", + "start": 172.8, + "end": 172.82, + "confidence": 0.309 + }, + { + "text": "marchand", + "start": 172.82, + "end": 173.14, + "confidence": 0.816 + }, + { + "text": "dessus,", + "start": 173.14, + "end": 173.42, + "confidence": 0.201 + } + ] + }, + { + "id": 51, + "seek": 16526, + "start": 173.86, + "end": 177.42, + "text": " soit des finissants débordes, des finissants, une signalétique.", + "tokens": [ + 50784, + 12703, + 730, + 962, + 891, + 1719, + 36529, + 765, + 279, + 11, + 730, + 962, + 891, + 1719, + 11, + 2251, + 6358, + 42379, + 13, + 50974 + ], + "temperature": 0.0, + "avg_logprob": -0.6644235849380493, + "compression_ratio": 1.4761904761904763, + "no_speech_prob": 0.1915542334318161, + "confidence": 0.582, + "words": [ + { + "text": "soit", + "start": 173.86, + "end": 174.4, + "confidence": 0.993 + }, + { + "text": "des", + "start": 174.4, + "end": 175.2, + "confidence": 0.759 + }, + { + "text": "finissants", + "start": 175.2, + "end": 175.58, + "confidence": 0.436 + }, + { + "text": "débordes,", + "start": 175.58, + "end": 175.98, + "confidence": 0.467 + }, + { + "text": "des", + "start": 176.14, + "end": 176.18, + "confidence": 0.222 + }, + { + "text": "finissants,", + "start": 176.18, + "end": 176.62, + "confidence": 0.961 + }, + { + "text": "une", + "start": 176.66, + "end": 176.84, + "confidence": 0.75 + }, + { + "text": "signalétique.", + "start": 176.84, + "end": 177.42, + "confidence": 0.566 + } + ] + } + ], + "language": "fr", + "language_probs": { + "en": 0.003095489228144288, + "zh": 0.0006387902540154755, + "de": 0.0005213654367253184, + "es": 0.0002621589810587466, + "ru": 9.644290548749268e-05, + "ko": 0.0004060397914145142, + 
"fr": 0.9878895878791809, + "ja": 0.001508620916865766, + "pt": 0.0008202229510061443, + "tr": 0.00010758983989944682, + "pl": 5.243510167929344e-05, + "ca": 5.111286554893013e-06, + "nl": 0.00018159222963731736, + "ar": 0.0003162241482641548, + "sv": 5.988276097923517e-05, + "it": 0.00041243399027734995, + "id": 5.3565827329293825e-06, + "hi": 1.899073504318949e-05, + "fi": 9.529085787107761e-07, + "vi": 1.4905997886671685e-05, + "he": 2.2728934709448367e-05, + "uk": 6.863543262625171e-07, + "el": 1.255210918316152e-05, + "ms": 3.63207291229628e-05, + "cs": 6.311596735031344e-06, + "ro": 1.2261339179531205e-05, + "da": 7.264603482326493e-06, + "hu": 9.775592843652703e-06, + "ta": 7.081414992171631e-07, + "no": 1.378579418087611e-05, + "th": 2.0533880160655826e-05, + "ur": 5.111286554893013e-06, + "hr": 9.435073167196606e-08, + "bg": 2.3956120003276737e-06, + "lt": 3.299109607723949e-08, + "la": 0.00038744587800465524, + "mi": 5.526619133888744e-06, + "ml": 1.522743559689843e-06, + "cy": 3.896646012435667e-05, + "sk": 3.397700254481606e-07, + "te": 1.4386768043550546e-07, + "fa": 3.17366993840551e-06, + "lv": 2.490298456336859e-08, + "bn": 2.2155788883537753e-06, + "sr": 3.273435922324097e-08, + "az": 4.94362438985263e-07, + "sl": 6.347739827106125e-07, + "kn": 3.197606801563779e-08, + "et": 7.761079245938163e-08, + "mk": 1.3515118268969672e-07, + "br": 0.0019371077651157975, + "eu": 1.2749776033160742e-05, + "is": 2.794872102640511e-07, + "hy": 1.2623987686311011e-06, + "ne": 1.2795857173841796e-07, + "mn": 1.9860319753206568e-06, + "bs": 8.26162533940078e-08, + "kk": 1.891105085860545e-07, + "sq": 1.3126870044288808e-06, + "sw": 2.2859089767734986e-06, + "gl": 1.2357507330307271e-05, + "mr": 7.976223770356228e-08, + "pa": 6.249327384466596e-07, + "si": 2.867172270271112e-06, + "km": 2.5158635253319517e-05, + "sn": 2.3086862711352296e-05, + "yo": 2.3634351236978546e-05, + "so": 8.52387884719974e-08, + "af": 5.221507990427199e-07, + "oc": 0.00014821125660091639, + 
"ka": 2.281108066881643e-07, + "be": 1.1584422736632405e-06, + "tg": 8.308935761647263e-09, + "sd": 1.3864739685232053e-06, + "gu": 6.044334810439977e-08, + "am": 1.9511351467826898e-07, + "yi": 4.581727807817515e-06, + "lo": 7.026307002888643e-07, + "uz": 2.0319157467696414e-10, + "fo": 4.075073320564115e-06, + "ht": 0.0001349478989141062, + "ps": 2.838884540778963e-07, + "tk": 5.8224053356426e-10, + "nn": 0.0004747086495626718, + "mt": 3.1423587643075734e-07, + "sa": 2.4716568987059873e-06, + "lb": 4.894851457493132e-08, + "my": 6.461271823354764e-06, + "bo": 3.052088686672505e-06, + "tl": 8.343945978595002e-07, + "mg": 1.7280938902075604e-09, + "as": 2.3352028222234367e-07, + "tt": 2.362024353885772e-09, + "haw": 5.988276097923517e-05, + "ln": 3.0825005524093285e-05, + "ha": 5.3437370084452596e-09, + "ba": 5.260104574134061e-10, + "jw": 7.394534623017535e-05, + "su": 7.896352460790013e-10 + } +} \ No newline at end of file diff --git a/tests/expected/tiny_fr.cpu/bonjour_vous_allez_bien.mp3.words.json b/tests/expected/tiny_fr.cpu/bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..adc9890af4a61ebbb4b7beeef62b7b6307ee0338 --- /dev/null +++ b/tests/expected/tiny_fr.cpu/bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,190 @@ +{ + "text": " Bonjour! Est-ce que vous allez bien? Bonjour! Bonjour! 
Est-ce que vous allez bien?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.46, + "end": 0.68, + "text": " Bonjour!", + "tokens": [ + 25431, + 2298 + ], + "temperature": 0.0, + "avg_logprob": -0.7739177703857422, + "compression_ratio": 0.8181818181818182, + "no_speech_prob": 0.04250079020857811, + "confidence": 0.69, + "words": [ + { + "text": "Bonjour!", + "start": 0.46, + "end": 0.68, + "confidence": 0.69 + } + ] + }, + { + "id": 1, + "seek": 148, + "start": 1.86, + "end": 2.8, + "text": " Est-ce que vous allez bien?", + "tokens": [ + 50364, + 4410, + 12, + 384, + 631, + 2630, + 18146, + 3610, + 2506, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.4815776131369851, + "compression_ratio": 0.7714285714285715, + "no_speech_prob": 0.04176269844174385, + "confidence": 0.632, + "words": [ + { + "text": "Est-ce", + "start": 1.86, + "end": 2.14, + "confidence": 0.548 + }, + { + "text": "que", + "start": 2.14, + "end": 2.18, + "confidence": 0.848 + }, + { + "text": "vous", + "start": 2.18, + "end": 2.34, + "confidence": 0.993 + }, + { + "text": "allez", + "start": 2.34, + "end": 2.48, + "confidence": 0.298 + }, + { + "text": "bien?", + "start": 2.48, + "end": 2.8, + "confidence": 0.979 + } + ] + }, + { + "id": 2, + "seek": 3148, + "start": 32.98, + "end": 33.16, + "text": " Bonjour!", + "tokens": [ + 25431, + 2298 + ], + "temperature": 0.0, + "avg_logprob": -0.34033950169881183, + "compression_ratio": 0.8181818181818182, + "no_speech_prob": 0.5495142936706543, + "confidence": 0.919, + "words": [ + { + "text": "Bonjour!", + "start": 32.98, + "end": 33.16, + "confidence": 0.919 + } + ] + }, + { + "id": 3, + "seek": 3348, + "start": 34.4, + "end": 34.61, + "text": " Bonjour!", + "tokens": [ + 25431, + 2298 + ], + "temperature": 0.0, + "avg_logprob": -0.23644089698791504, + "compression_ratio": 0.8181818181818182, + "no_speech_prob": 0.40533149242401123, + "confidence": 0.331, + "words": [ + { + "text": "Bonjour!", + "start": 34.4, + "end": 34.61, + 
"confidence": 0.331 + } + ] + }, + { + "id": 4, + "seek": 3448, + "start": 34.61, + "end": 35.34, + "text": " Est-ce que vous allez bien?", + "tokens": [ + 50364, + 4410, + 12, + 384, + 631, + 2630, + 18146, + 3610, + 2506, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -0.17279924045909534, + "compression_ratio": 0.7714285714285715, + "no_speech_prob": 0.5867945551872253, + "confidence": 0.871, + "words": [ + { + "text": "Est-ce", + "start": 34.61, + "end": 34.66, + "confidence": 0.741 + }, + { + "text": "que", + "start": 34.66, + "end": 34.72, + "confidence": 0.979 + }, + { + "text": "vous", + "start": 34.72, + "end": 34.86, + "confidence": 0.999 + }, + { + "text": "allez", + "start": 34.86, + "end": 35.0, + "confidence": 0.959 + }, + { + "text": "bien?", + "start": 35.0, + "end": 35.34, + "confidence": 1.0 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr.cpu/radio_short.mp3.words.json b/tests/expected/tiny_fr.cpu/radio_short.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..b1910cc5b3224406e946a7c50d9507d3dfe850fe --- /dev/null +++ b/tests/expected/tiny_fr.cpu/radio_short.mp3.words.json @@ -0,0 +1,104 @@ +{ + "text": "............", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.08, + "end": 0.76, + "text": "...", + "tokens": [ + 50364, + 1097, + 50614 + ], + "temperature": 0.0, + "avg_logprob": -1.4265364408493042, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.5112143754959106, + "confidence": 0.224, + "words": [ + { + "text": "...", + "start": 0.08, + "end": 0.76, + "confidence": 0.224 + } + ] + }, + { + "id": 1, + "seek": 6000, + "start": 60.02, + "end": 69.4, + "text": "...", + "tokens": [ + 50364, + 1097, + 51714 + ], + "temperature": 0.0, + "avg_logprob": -0.973953366279602, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.8780310153961182, + "confidence": 0.466, + "words": [ + { + "text": "...", + "start": 60.02, + 
"end": 69.4, + "confidence": 0.466 + } + ] + }, + { + "id": 2, + "seek": 9000, + "start": 90.02, + "end": 90.24, + "text": "...", + "tokens": [ + 1097 + ], + "temperature": 0.0, + "avg_logprob": -0.8283956527709961, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.641629695892334, + "confidence": 0.842, + "words": [ + { + "text": "...", + "start": 90.02, + "end": 90.24, + "confidence": 0.842 + } + ] + }, + { + "id": 3, + "seek": 10500, + "start": 105.04, + "end": 117.76, + "text": "...", + "tokens": [ + 50364, + 1097, + 51714 + ], + "temperature": 0.0, + "avg_logprob": -0.728730320930481, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.25682491064071655, + "confidence": 0.764, + "words": [ + { + "text": "...", + "start": 105.04, + "end": 117.76, + "confidence": 0.764 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr.cpu/smartphone.mp3.words.json b/tests/expected/tiny_fr.cpu/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..f90643caf0519b49ba0cbc0381cd8d8ced1f218b --- /dev/null +++ b/tests/expected/tiny_fr.cpu/smartphone.mp3.words.json @@ -0,0 +1,5038 @@ +{ + "text": " C'est évidence que dit Nicolas. Mais je me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière dans quelques interagues entraîne. Et il est d'ailleurs, c'est la photo c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces les grand-attêtes qu'il a été beaucoup très souvent ementionné. Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs nous ont appris à piquer sur des icônes. C'est ce que le smartphone ajoute le toucher, qui rend le contact plus direct, plus sensible. Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté tout flu de la navigation web pour aller directement en but. 
Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas, dit qu'il est très fondablement inédit dans l'histoire de l'humanité. Mais ça s'assoulait d'une autre interrogation. Est-ce que le fait que cette objet soit inédit un d'huies que notre rapport a lui est aussi un rapport inédit? Je veux dire, est-ce que le rapport qu'on a au sein de foi n'est comparable à celui qu'on entretenait à d'autres objectes techniques comme la voiture ou le téléphone? Il n'y a pas d'équivalent. On s'est espécie de nous voter dans la relation à l'objet. C'est facilement éterréciant parce qu'on a impression de, comme le 10, les utilisateurs et les efforts, elles aident dépendant de cette objet d'un lieu, en fait, une espèce de relation de médiation avec le monde qui rendent un peu avec la même sédiforme de le jeu. Donc, à objets inédits, rapport inédits. Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépenses et de rojets. Bon, en vrai, il faudrait remonter très très finement toute l'histoire des objectes techniques et de leur infération dans le vie pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas se trompe pas vraiment. Pour autant, je sache. Il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais la dépense n'était pas du même mort, donc le rejet n'en plus n'était pas du même mort. On peut adorer sa bagnure, en avoir besoin pour plein de choses. Et là, le soir, quand on va se coucher, on la laisse. On l'a pas dans la main, quand on est collis, quand on n'en mène pas au chiot. On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui continuuellement avec son smartphone dans la main, comme c'était une sorte de estimateur extère de l'intempis de lâcher à l'éantrénée, ça m'a eu immédiate. 
Bon, je dis ça pour le mome, mais évidemment, va là pour nos aussi. Donc, rapport immédiate d'accord. Mais pourquoi, à ton impression qu'on en sortira jamais? Et puis, il faut en remettre la faute sur les gens qui ont créé cette route merveilleux et diabolique, qui a dit à bollique par coeur, merveilleux. Les économistes parlent de dépendance du santé. Ces vidéos, en fait, on est un santé qui a été établie, c'est un soit mon termine, soit définissant des beurs, on définisse un signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 1.38, + "text": " C'est évidence que dit Nicolas.", + "tokens": [ + 383, + 6, + 377, + 20090, + 2778, + 631, + 6176, + 38268, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.625, + "words": [ + { + "text": "C'est", + "start": 0.42, + "end": 0.66, + "confidence": 0.849 + }, + { + "text": "évidence", + "start": 0.66, + "end": 0.94, + "confidence": 0.368 + }, + { + "text": "que", + "start": 0.94, + "end": 1.06, + "confidence": 0.883 + }, + { + "text": "dit", + "start": 1.06, + "end": 1.16, + "confidence": 0.344 + }, + { + "text": "Nicolas.", + "start": 1.16, + "end": 1.38, + "confidence": 0.921 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.66, + "end": 3.62, + "text": " Mais je me l'étais jamais formulé comme ça.", + "tokens": [ + 6313, + 1506, + 385, + 287, + 6, + 22824, + 14540, + 1254, + 425, + 526, + 5173, + 2788, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.745, + "words": [ + { + "text": "Mais", + "start": 1.66, + "end": 1.9, + "confidence": 0.956 + }, + { + "text": "je", + "start": 1.9, + "end": 2.18, + "confidence": 0.629 + }, + { + "text": "me", + "start": 2.18, + "end": 2.3, + "confidence": 0.943 + }, + { + "text": "l'étais", + "start": 2.3, + "end": 
2.54, + "confidence": 0.708 + }, + { + "text": "jamais", + "start": 2.54, + "end": 2.78, + "confidence": 0.962 + }, + { + "text": "formulé", + "start": 2.78, + "end": 3.2, + "confidence": 0.541 + }, + { + "text": "comme", + "start": 3.2, + "end": 3.34, + "confidence": 0.975 + }, + { + "text": "ça.", + "start": 3.34, + "end": 3.62, + "confidence": 0.979 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 4.14, + "end": 8.82, + "text": " Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière", + "tokens": [ + 8257, + 1956, + 3887, + 635, + 3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 635, + 12713, + 2776, + 730, + 17290, + 3916, + 11, + 2420, + 635, + 22267 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.762, + "words": [ + { + "text": "Ce", + "start": 4.14, + "end": 4.22, + "confidence": 0.39 + }, + { + "text": "qui", + "start": 4.22, + "end": 4.34, + "confidence": 0.934 + }, + { + "text": "fait", + "start": 4.34, + "end": 4.46, + "confidence": 0.735 + }, + { + "text": "la", + "start": 4.46, + "end": 4.56, + "confidence": 0.988 + }, + { + "text": "force", + "start": 4.56, + "end": 4.96, + "confidence": 0.933 + }, + { + "text": "du", + "start": 4.96, + "end": 5.16, + "confidence": 0.936 + }, + { + "text": "smartphone,", + "start": 5.16, + "end": 5.74, + "confidence": 0.909 + }, + { + "text": "c'est", + "start": 5.74, + "end": 6.12, + "confidence": 0.871 + }, + { + "text": "pas", + "start": 6.12, + "end": 6.2, + "confidence": 0.982 + }, + { + "text": "seulement", + "start": 6.2, + "end": 6.52, + "confidence": 0.991 + }, + { + "text": "la", + "start": 6.52, + "end": 6.76, + "confidence": 0.627 + }, + { + "text": "cumulation", + "start": 6.76, + "end": 7.18, + "confidence": 0.679 + }, + { + "text": "des", + "start": 7.18, + "end": 7.54, + "confidence": 0.752 + }, + { + "text": 
"fonctions,", + "start": 7.54, + "end": 8.1, + "confidence": 0.826 + }, + { + "text": "mais", + "start": 8.1, + "end": 8.42, + "confidence": 0.511 + }, + { + "text": "la", + "start": 8.42, + "end": 8.58, + "confidence": 0.717 + }, + { + "text": "manière", + "start": 8.58, + "end": 8.82, + "confidence": 0.457 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 8.9, + "end": 10.84, + "text": " dans quelques interagues entraîne.", + "tokens": [ + 2680, + 16597, + 728, + 559, + 1247, + 22284, + 24741, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.3, + "words": [ + { + "text": "dans", + "start": 8.9, + "end": 9.04, + "confidence": 0.329 + }, + { + "text": "quelques", + "start": 9.04, + "end": 9.26, + "confidence": 0.282 + }, + { + "text": "interagues", + "start": 9.26, + "end": 10.18, + "confidence": 0.238 + }, + { + "text": "entraîne.", + "start": 10.18, + "end": 10.84, + "confidence": 0.421 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 11.04, + "end": 12.92, + "text": " Et il est d'ailleurs, c'est la photo c'est hyper convaincant.", + "tokens": [ + 3790, + 1930, + 871, + 274, + 6, + 19400, + 11, + 269, + 6, + 377, + 635, + 5052, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.625, + "words": [ + { + "text": "Et", + "start": 11.04, + "end": 11.1, + "confidence": 0.394 + }, + { + "text": "il", + "start": 11.1, + "end": 11.24, + "confidence": 0.128 + }, + { + "text": "est", + "start": 11.24, + "end": 11.38, + "confidence": 0.237 + }, + { + "text": "d'ailleurs,", + "start": 11.38, + "end": 11.62, + "confidence": 0.904 + }, + { + "text": "c'est", + "start": 11.62, + "end": 11.78, + "confidence": 0.879 + }, + { + "text": "la", + "start": 11.78, + "end": 11.82, + 
"confidence": 0.968 + }, + { + "text": "photo", + "start": 11.82, + "end": 11.92, + "confidence": 0.811 + }, + { + "text": "c'est", + "start": 11.92, + "end": 12.18, + "confidence": 0.792 + }, + { + "text": "hyper", + "start": 12.18, + "end": 12.38, + "confidence": 0.939 + }, + { + "text": "convaincant.", + "start": 12.38, + "end": 12.92, + "confidence": 0.494 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 13.26, + "end": 18.03, + "text": " Alors évidemment, il faudrait ajouter les interfaces les grand-attêtes qu'il a été beaucoup", + "tokens": [ + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 1512, + 2697, + 12, + 1591, + 38262, + 421, + 6, + 388, + 257, + 8862, + 8796 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.553, + "words": [ + { + "text": "Alors", + "start": 13.26, + "end": 13.48, + "confidence": 0.904 + }, + { + "text": "évidemment,", + "start": 13.48, + "end": 13.92, + "confidence": 0.785 + }, + { + "text": "il", + "start": 13.92, + "end": 14.4, + "confidence": 0.961 + }, + { + "text": "faudrait", + "start": 14.4, + "end": 14.76, + "confidence": 0.85 + }, + { + "text": "ajouter", + "start": 14.76, + "end": 15.38, + "confidence": 0.874 + }, + { + "text": "les", + "start": 15.38, + "end": 15.62, + "confidence": 0.933 + }, + { + "text": "interfaces", + "start": 15.62, + "end": 15.86, + "confidence": 0.359 + }, + { + "text": "les", + "start": 15.86, + "end": 16.5, + "confidence": 0.414 + }, + { + "text": "grand-attêtes", + "start": 16.5, + "end": 16.94, + "confidence": 0.178 + }, + { + "text": "qu'il", + "start": 16.94, + "end": 17.18, + "confidence": 0.632 + }, + { + "text": "a", + "start": 17.18, + "end": 17.24, + "confidence": 0.969 + }, + { + "text": "été", + "start": 17.24, + "end": 17.5, + "confidence": 0.957 + }, + { + "text": "beaucoup", + "start": 17.5, + "end": 18.03, + "confidence": 0.572 + 
} + ] + }, + { + "id": 6, + "seek": 0, + "start": 18.03, + "end": 19.26, + "text": " très souvent ementionné.", + "tokens": [ + 5732, + 20847, + 846, + 1251, + 15055, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.541, + "words": [ + { + "text": "très", + "start": 18.03, + "end": 18.66, + "confidence": 0.959 + }, + { + "text": "souvent", + "start": 18.66, + "end": 18.82, + "confidence": 0.994 + }, + { + "text": "ementionné.", + "start": 18.82, + "end": 19.26, + "confidence": 0.365 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 19.86, + "end": 23.54, + "text": " Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs", + "tokens": [ + 6313, + 4428, + 11, + 1930, + 38694, + 8645, + 631, + 1512, + 1740, + 3324, + 6212, + 368, + 945, + 1567, + 17338, + 287, + 6, + 21210, + 11, + 1512, + 4792, + 13923, + 2156 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.648, + "words": [ + { + "text": "Mais", + "start": 19.86, + "end": 20.22, + "confidence": 0.975 + }, + { + "text": "bon,", + "start": 20.22, + "end": 20.56, + "confidence": 0.479 + }, + { + "text": "il", + "start": 20.56, + "end": 20.6, + "confidence": 0.978 + }, + { + "text": "faudrait", + "start": 20.6, + "end": 20.74, + "confidence": 0.753 + }, + { + "text": "que", + "start": 20.74, + "end": 20.92, + "confidence": 0.378 + }, + { + "text": "les", + "start": 20.92, + "end": 20.98, + "confidence": 0.182 + }, + { + "text": "profites", + "start": 20.98, + "end": 21.26, + "confidence": 0.622 + }, + { + "text": "aussi", + "start": 21.26, + "end": 21.7, + "confidence": 0.502 + }, + { + "text": "de", + "start": 21.7, + "end": 21.84, + "confidence": 0.468 + }, + { + "text": "20", + "start": 21.84, + "end": 22.08, + "confidence": 0.924 + }, + { + "text": 
"ans", + "start": 22.08, + "end": 22.28, + "confidence": 0.937 + }, + { + "text": "pendant", + "start": 22.28, + "end": 22.46, + "confidence": 0.903 + }, + { + "text": "l'été,", + "start": 22.46, + "end": 22.96, + "confidence": 0.499 + }, + { + "text": "les", + "start": 22.96, + "end": 23.04, + "confidence": 0.861 + }, + { + "text": "ordinateurs", + "start": 23.04, + "end": 23.54, + "confidence": 0.934 + } + ] + }, + { + "id": 8, + "seek": 0, + "start": 23.58, + "end": 25.26, + "text": " nous ont appris à piquer sur des icônes.", + "tokens": [ + 4666, + 6592, + 724, + 5714, + 1531, + 280, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.566579490710216, + "compression_ratio": 1.605421686746988, + "no_speech_prob": 0.14170263707637787, + "confidence": 0.663, + "words": [ + { + "text": "nous", + "start": 23.58, + "end": 23.74, + "confidence": 0.833 + }, + { + "text": "ont", + "start": 23.74, + "end": 23.86, + "confidence": 0.976 + }, + { + "text": "appris", + "start": 23.86, + "end": 24.06, + "confidence": 0.947 + }, + { + "text": "à", + "start": 24.06, + "end": 24.24, + "confidence": 0.24 + }, + { + "text": "piquer", + "start": 24.24, + "end": 24.42, + "confidence": 0.45 + }, + { + "text": "sur", + "start": 24.42, + "end": 24.68, + "confidence": 0.749 + }, + { + "text": "des", + "start": 24.68, + "end": 24.8, + "confidence": 0.96 + }, + { + "text": "icônes.", + "start": 24.8, + "end": 25.26, + "confidence": 0.656 + } + ] + }, + { + "id": 9, + "seek": 2556, + "start": 25.58, + "end": 30.56, + "text": " C'est ce que le smartphone ajoute le toucher, qui rend le contact plus direct, plus sensible.", + "tokens": [ + 383, + 6, + 377, + 1769, + 631, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 
0.0006256799097172916, + "confidence": 0.643, + "words": [ + { + "text": "C'est", + "start": 25.58, + "end": 25.66, + "confidence": 0.449 + }, + { + "text": "ce", + "start": 25.66, + "end": 25.72, + "confidence": 0.491 + }, + { + "text": "que", + "start": 25.72, + "end": 25.94, + "confidence": 0.935 + }, + { + "text": "le", + "start": 25.94, + "end": 26.6, + "confidence": 0.377 + }, + { + "text": "smartphone", + "start": 26.6, + "end": 26.86, + "confidence": 0.977 + }, + { + "text": "ajoute", + "start": 26.86, + "end": 27.42, + "confidence": 0.813 + }, + { + "text": "le", + "start": 27.42, + "end": 27.64, + "confidence": 0.957 + }, + { + "text": "toucher,", + "start": 27.64, + "end": 28.06, + "confidence": 0.73 + }, + { + "text": "qui", + "start": 28.06, + "end": 28.18, + "confidence": 0.209 + }, + { + "text": "rend", + "start": 28.18, + "end": 28.34, + "confidence": 0.877 + }, + { + "text": "le", + "start": 28.34, + "end": 28.68, + "confidence": 0.991 + }, + { + "text": "contact", + "start": 28.68, + "end": 28.96, + "confidence": 0.854 + }, + { + "text": "plus", + "start": 28.96, + "end": 29.48, + "confidence": 0.865 + }, + { + "text": "direct,", + "start": 29.48, + "end": 29.96, + "confidence": 0.692 + }, + { + "text": "plus", + "start": 29.96, + "end": 30.24, + "confidence": 0.928 + }, + { + "text": "sensible.", + "start": 30.24, + "end": 30.56, + "confidence": 0.332 + } + ] + }, + { + "id": 10, + "seek": 2556, + "start": 31.04, + "end": 34.34, + "text": " Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner", + "tokens": [ + 3790, + 9093, + 11, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.827, + "words": [ + { + "text": "Et", + "start": 31.04, + "end": 31.24, + "confidence": 0.914 + 
}, + { + "text": "puis,", + "start": 31.24, + "end": 31.34, + "confidence": 0.713 + }, + { + "text": "évidemment,", + "start": 31.34, + "end": 31.64, + "confidence": 0.378 + }, + { + "text": "il", + "start": 31.64, + "end": 31.78, + "confidence": 0.935 + }, + { + "text": "faudrait", + "start": 31.78, + "end": 31.88, + "confidence": 0.99 + }, + { + "text": "parler", + "start": 31.88, + "end": 32.12, + "confidence": 0.882 + }, + { + "text": "aussi", + "start": 32.12, + "end": 32.3, + "confidence": 0.889 + }, + { + "text": "des", + "start": 32.3, + "end": 32.44, + "confidence": 0.927 + }, + { + "text": "applications", + "start": 32.44, + "end": 32.78, + "confidence": 0.839 + }, + { + "text": "qui", + "start": 32.78, + "end": 33.16, + "confidence": 0.652 + }, + { + "text": "permettent", + "start": 33.16, + "end": 33.68, + "confidence": 0.951 + }, + { + "text": "de", + "start": 33.68, + "end": 33.9, + "confidence": 0.952 + }, + { + "text": "contourner", + "start": 33.9, + "end": 34.34, + "confidence": 0.787 + } + ] + }, + { + "id": 11, + "seek": 2556, + "start": 34.34, + "end": 37.72, + "text": " le côté tout flu de la navigation web pour aller directement en but.", + "tokens": [ + 476, + 18437, + 3486, + 5029, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 465, + 457, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.766, + "words": [ + { + "text": "le", + "start": 34.34, + "end": 34.52, + "confidence": 0.989 + }, + { + "text": "côté", + "start": 34.52, + "end": 34.72, + "confidence": 0.983 + }, + { + "text": "tout", + "start": 34.72, + "end": 34.96, + "confidence": 0.954 + }, + { + "text": "flu", + "start": 34.96, + "end": 35.2, + "confidence": 0.548 + }, + { + "text": "de", + "start": 35.2, + "end": 35.42, + "confidence": 0.248 + }, + { + "text": "la", + "start": 35.42, + "end": 35.72, + "confidence": 0.902 + }, + { + "text": 
"navigation", + "start": 35.72, + "end": 36.04, + "confidence": 0.913 + }, + { + "text": "web", + "start": 36.04, + "end": 36.64, + "confidence": 0.93 + }, + { + "text": "pour", + "start": 36.64, + "end": 36.76, + "confidence": 0.746 + }, + { + "text": "aller", + "start": 36.76, + "end": 36.94, + "confidence": 0.992 + }, + { + "text": "directement", + "start": 36.94, + "end": 37.46, + "confidence": 0.986 + }, + { + "text": "en", + "start": 37.46, + "end": 37.68, + "confidence": 0.644 + }, + { + "text": "but.", + "start": 37.68, + "end": 37.72, + "confidence": 0.689 + } + ] + }, + { + "id": 12, + "seek": 2556, + "start": 37.72, + "end": 43.06, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas,", + "tokens": [ + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 5550, + 14964, + 11, + 465, + 38268, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.725, + "words": [ + { + "text": "Bref,", + "start": 37.72, + "end": 38.9, + "confidence": 0.967 + }, + { + "text": "tout", + "start": 38.9, + "end": 38.98, + "confidence": 0.786 + }, + { + "text": "ça,", + "start": 38.98, + "end": 39.36, + "confidence": 0.985 + }, + { + "text": "ce", + "start": 39.36, + "end": 39.68, + "confidence": 0.929 + }, + { + "text": "sont", + "start": 39.68, + "end": 39.84, + "confidence": 0.963 + }, + { + "text": "les", + "start": 39.84, + "end": 40.06, + "confidence": 0.976 + }, + { + "text": "conditions", + "start": 40.06, + "end": 40.54, + "confidence": 0.96 + }, + { + "text": "qui", + "start": 40.54, + "end": 40.9, + "confidence": 0.995 + }, + { + "text": "permettent", + "start": 40.9, + "end": 41.54, + "confidence": 0.986 + }, + { + "text": "de", + "start": 41.54, + "end": 41.58, + "confidence": 0.989 + }, + { + "text": "créer", + "start": 41.58, + "end": 41.92, + 
"confidence": 0.918 + }, + { + "text": "cette", + "start": 41.92, + "end": 42.3, + "confidence": 0.518 + }, + { + "text": "objet,", + "start": 42.3, + "end": 42.7, + "confidence": 0.213 + }, + { + "text": "en", + "start": 42.7, + "end": 42.8, + "confidence": 0.191 + }, + { + "text": "Nicolas,", + "start": 42.8, + "end": 43.06, + "confidence": 0.508 + } + ] + }, + { + "id": 13, + "seek": 2556, + "start": 43.1, + "end": 46.48, + "text": " dit qu'il est très fondablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 6176, + 421, + 6, + 388, + 871, + 5732, + 9557, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.768, + "words": [ + { + "text": "dit", + "start": 43.1, + "end": 43.52, + "confidence": 0.551 + }, + { + "text": "qu'il", + "start": 43.52, + "end": 43.68, + "confidence": 0.969 + }, + { + "text": "est", + "start": 43.68, + "end": 43.8, + "confidence": 0.851 + }, + { + "text": "très", + "start": 43.8, + "end": 43.94, + "confidence": 0.368 + }, + { + "text": "fondablement", + "start": 43.94, + "end": 44.68, + "confidence": 0.593 + }, + { + "text": "inédit", + "start": 44.68, + "end": 45.52, + "confidence": 0.66 + }, + { + "text": "dans", + "start": 45.52, + "end": 45.74, + "confidence": 0.778 + }, + { + "text": "l'histoire", + "start": 45.74, + "end": 45.98, + "confidence": 0.825 + }, + { + "text": "de", + "start": 45.98, + "end": 46.08, + "confidence": 0.978 + }, + { + "text": "l'humanité.", + "start": 46.08, + "end": 46.48, + "confidence": 0.991 + } + ] + }, + { + "id": 14, + "seek": 2556, + "start": 47.06, + "end": 48.76, + "text": " Mais ça s'assoulait d'une autre interrogation.", + "tokens": [ + 6313, + 2788, + 262, + 6, + 640, + 263, + 35235, + 274, + 6, + 2613, + 15081, + 24871, + 399, + 13 + ], + "temperature": 0.0, + 
"avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.697, + "words": [ + { + "text": "Mais", + "start": 47.06, + "end": 47.16, + "confidence": 0.939 + }, + { + "text": "ça", + "start": 47.16, + "end": 47.46, + "confidence": 0.854 + }, + { + "text": "s'assoulait", + "start": 47.46, + "end": 47.78, + "confidence": 0.591 + }, + { + "text": "d'une", + "start": 47.78, + "end": 48.02, + "confidence": 0.619 + }, + { + "text": "autre", + "start": 48.02, + "end": 48.14, + "confidence": 0.966 + }, + { + "text": "interrogation.", + "start": 48.14, + "end": 48.76, + "confidence": 0.833 + } + ] + }, + { + "id": 15, + "seek": 2556, + "start": 49.26, + "end": 54.34, + "text": " Est-ce que le fait que cette objet soit inédit un d'huies que notre rapport a lui est aussi", + "tokens": [ + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 5550, + 14964, + 12703, + 294, + 7811, + 270, + 517, + 274, + 6, + 12086, + 530, + 631, + 10349, + 18018, + 257, + 8783, + 871, + 6212 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.697, + "words": [ + { + "text": "Est-ce", + "start": 49.26, + "end": 49.7, + "confidence": 0.804 + }, + { + "text": "que", + "start": 49.7, + "end": 49.74, + "confidence": 0.989 + }, + { + "text": "le", + "start": 49.74, + "end": 49.78, + "confidence": 0.882 + }, + { + "text": "fait", + "start": 49.78, + "end": 49.96, + "confidence": 0.962 + }, + { + "text": "que", + "start": 49.96, + "end": 50.08, + "confidence": 0.935 + }, + { + "text": "cette", + "start": 50.08, + "end": 50.24, + "confidence": 0.95 + }, + { + "text": "objet", + "start": 50.24, + "end": 50.5, + "confidence": 0.968 + }, + { + "text": "soit", + "start": 50.5, + "end": 50.96, + "confidence": 0.991 + }, + { + "text": "inédit", + "start": 50.96, + "end": 51.78, + "confidence": 0.91 + }, + { + "text": 
"un", + "start": 51.78, + "end": 52.06, + "confidence": 0.442 + }, + { + "text": "d'huies", + "start": 52.06, + "end": 52.32, + "confidence": 0.298 + }, + { + "text": "que", + "start": 52.32, + "end": 52.4, + "confidence": 0.966 + }, + { + "text": "notre", + "start": 52.4, + "end": 52.58, + "confidence": 0.992 + }, + { + "text": "rapport", + "start": 52.58, + "end": 53.1, + "confidence": 0.714 + }, + { + "text": "a", + "start": 53.1, + "end": 53.44, + "confidence": 0.522 + }, + { + "text": "lui", + "start": 53.44, + "end": 53.62, + "confidence": 0.659 + }, + { + "text": "est", + "start": 53.62, + "end": 54.0, + "confidence": 0.643 + }, + { + "text": "aussi", + "start": 54.0, + "end": 54.34, + "confidence": 0.808 + } + ] + }, + { + "id": 16, + "seek": 2556, + "start": 54.34, + "end": 55.32, + "text": " un rapport inédit?", + "tokens": [ + 517, + 18018, + 294, + 7811, + 270, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.4095459938049316, + "compression_ratio": 1.7522658610271904, + "no_speech_prob": 0.0006256799097172916, + "confidence": 0.849, + "words": [ + { + "text": "un", + "start": 54.34, + "end": 54.72, + "confidence": 0.506 + }, + { + "text": "rapport", + "start": 54.72, + "end": 54.94, + "confidence": 0.999 + }, + { + "text": "inédit?", + "start": 54.94, + "end": 55.32, + "confidence": 0.956 + } + ] + }, + { + "id": 17, + "seek": 5548, + "start": 55.6, + "end": 58.6, + "text": " Je veux dire, est-ce que le rapport qu'on a au sein de foi n'est comparable à celui", + "tokens": [ + 2588, + 16389, + 1264, + 11, + 871, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 6195, + 368, + 6901, + 297, + 6, + 377, + 6311, + 712, + 1531, + 22829 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.626, + "words": [ + { + "text": "Je", + "start": 55.6, + "end": 55.84, + "confidence": 0.335 + }, + { + "text": "veux", + "start": 
55.84, + "end": 55.94, + "confidence": 0.432 + }, + { + "text": "dire,", + "start": 55.94, + "end": 56.16, + "confidence": 0.992 + }, + { + "text": "est-ce", + "start": 56.16, + "end": 56.34, + "confidence": 0.951 + }, + { + "text": "que", + "start": 56.34, + "end": 56.4, + "confidence": 0.973 + }, + { + "text": "le", + "start": 56.4, + "end": 56.54, + "confidence": 0.987 + }, + { + "text": "rapport", + "start": 56.54, + "end": 56.76, + "confidence": 0.999 + }, + { + "text": "qu'on", + "start": 56.76, + "end": 57.1, + "confidence": 0.906 + }, + { + "text": "a", + "start": 57.1, + "end": 57.14, + "confidence": 0.974 + }, + { + "text": "au", + "start": 57.14, + "end": 57.26, + "confidence": 0.319 + }, + { + "text": "sein", + "start": 57.26, + "end": 57.36, + "confidence": 0.244 + }, + { + "text": "de", + "start": 57.36, + "end": 57.44, + "confidence": 0.177 + }, + { + "text": "foi", + "start": 57.44, + "end": 57.54, + "confidence": 0.163 + }, + { + "text": "n'est", + "start": 57.54, + "end": 57.78, + "confidence": 0.777 + }, + { + "text": "comparable", + "start": 57.78, + "end": 58.32, + "confidence": 0.606 + }, + { + "text": "à", + "start": 58.32, + "end": 58.46, + "confidence": 0.482 + }, + { + "text": "celui", + "start": 58.46, + "end": 58.6, + "confidence": 0.831 + } + ] + }, + { + "id": 18, + "seek": 5548, + "start": 58.72, + "end": 62.81, + "text": " qu'on entretenait à d'autres objectes techniques comme la voiture ou le téléphone?", + "tokens": [ + 421, + 6, + 266, + 3962, + 1147, + 1001, + 1531, + 274, + 6, + 16752, + 2657, + 279, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.781, + "words": [ + { + "text": "qu'on", + "start": 58.72, + "end": 58.88, + "confidence": 0.941 + }, + { + "text": "entretenait", + "start": 58.88, + "end": 59.38, + "confidence": 0.657 + }, + { + 
"text": "à", + "start": 59.38, + "end": 59.44, + "confidence": 0.973 + }, + { + "text": "d'autres", + "start": 59.44, + "end": 59.64, + "confidence": 0.909 + }, + { + "text": "objectes", + "start": 59.64, + "end": 60.02, + "confidence": 0.528 + }, + { + "text": "techniques", + "start": 60.02, + "end": 60.38, + "confidence": 0.547 + }, + { + "text": "comme", + "start": 60.38, + "end": 60.86, + "confidence": 0.662 + }, + { + "text": "la", + "start": 60.86, + "end": 61.46, + "confidence": 0.898 + }, + { + "text": "voiture", + "start": 61.46, + "end": 61.8, + "confidence": 0.954 + }, + { + "text": "ou", + "start": 61.8, + "end": 62.32, + "confidence": 0.74 + }, + { + "text": "le", + "start": 62.32, + "end": 62.6, + "confidence": 0.847 + }, + { + "text": "téléphone?", + "start": 62.6, + "end": 62.81, + "confidence": 0.979 + } + ] + }, + { + "id": 19, + "seek": 5548, + "start": 62.81, + "end": 66.07, + "text": " Il n'y a pas d'équivalent.", + "tokens": [ + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.882, + "words": [ + { + "text": "Il", + "start": 62.81, + "end": 65.42, + "confidence": 0.866 + }, + { + "text": "n'y", + "start": 65.42, + "end": 65.52, + "confidence": 0.865 + }, + { + "text": "a", + "start": 65.52, + "end": 65.56, + "confidence": 0.965 + }, + { + "text": "pas", + "start": 65.56, + "end": 65.62, + "confidence": 0.998 + }, + { + "text": "d'équivalent.", + "start": 65.62, + "end": 66.07, + "confidence": 0.858 + } + ] + }, + { + "id": 20, + "seek": 5548, + "start": 66.07, + "end": 69.74, + "text": " On s'est espécie de nous voter dans la relation à l'objet.", + "tokens": [ + 1282, + 262, + 6, + 377, + 7089, + 526, + 4260, + 368, + 4666, + 21722, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 13 + ], + "temperature": 0.0, + "avg_logprob": 
-0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.552, + "words": [ + { + "text": "On", + "start": 66.07, + "end": 67.0, + "confidence": 0.29 + }, + { + "text": "s'est", + "start": 67.0, + "end": 67.26, + "confidence": 0.562 + }, + { + "text": "espécie", + "start": 67.26, + "end": 67.46, + "confidence": 0.233 + }, + { + "text": "de", + "start": 67.46, + "end": 67.58, + "confidence": 0.963 + }, + { + "text": "nous", + "start": 67.58, + "end": 67.8, + "confidence": 0.631 + }, + { + "text": "voter", + "start": 67.8, + "end": 68.24, + "confidence": 0.241 + }, + { + "text": "dans", + "start": 68.24, + "end": 68.68, + "confidence": 0.853 + }, + { + "text": "la", + "start": 68.68, + "end": 68.88, + "confidence": 0.61 + }, + { + "text": "relation", + "start": 68.88, + "end": 69.22, + "confidence": 0.932 + }, + { + "text": "à", + "start": 69.22, + "end": 69.34, + "confidence": 0.792 + }, + { + "text": "l'objet.", + "start": 69.34, + "end": 69.74, + "confidence": 0.889 + } + ] + }, + { + "id": 21, + "seek": 5548, + "start": 70.18, + "end": 74.78, + "text": " C'est facilement éterréciant parce qu'on a impression de, comme le 10, les utilisateurs", + "tokens": [ + 383, + 6, + 377, + 23670, + 518, + 1136, + 391, + 10521, + 537, + 394, + 6992, + 421, + 6, + 266, + 257, + 9995, + 368, + 11, + 5173, + 476, + 1266, + 11, + 1512, + 33643, + 25929 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.491, + "words": [ + { + "text": "C'est", + "start": 70.18, + "end": 70.34, + "confidence": 0.907 + }, + { + "text": "facilement", + "start": 70.34, + "end": 70.72, + "confidence": 0.527 + }, + { + "text": "éterréciant", + "start": 70.72, + "end": 71.56, + "confidence": 0.277 + }, + { + "text": "parce", + "start": 71.56, + "end": 71.82, + "confidence": 0.298 + }, + { + "text": "qu'on", + "start": 
71.82, + "end": 72.3, + "confidence": 0.775 + }, + { + "text": "a", + "start": 72.3, + "end": 72.4, + "confidence": 0.563 + }, + { + "text": "impression", + "start": 72.4, + "end": 72.74, + "confidence": 0.148 + }, + { + "text": "de,", + "start": 72.74, + "end": 73.36, + "confidence": 0.211 + }, + { + "text": "comme", + "start": 73.36, + "end": 73.8, + "confidence": 0.843 + }, + { + "text": "le", + "start": 73.8, + "end": 73.96, + "confidence": 0.9 + }, + { + "text": "10,", + "start": 73.96, + "end": 74.28, + "confidence": 0.395 + }, + { + "text": "les", + "start": 74.28, + "end": 74.32, + "confidence": 0.581 + }, + { + "text": "utilisateurs", + "start": 74.32, + "end": 74.78, + "confidence": 0.745 + } + ] + }, + { + "id": 22, + "seek": 5548, + "start": 74.8, + "end": 77.93, + "text": " et les efforts, elles aident dépendant de cette objet d'un lieu, en fait, une espèce de", + "tokens": [ + 1030, + 1512, + 6484, + 11, + 23576, + 257, + 1078, + 45768, + 394, + 368, + 5550, + 14964, + 274, + 6, + 409, + 26036, + 11, + 465, + 3887, + 11, + 2251, + 7089, + 30236, + 368 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.464, + "words": [ + { + "text": "et", + "start": 74.8, + "end": 74.92, + "confidence": 0.147 + }, + { + "text": "les", + "start": 74.92, + "end": 74.96, + "confidence": 0.242 + }, + { + "text": "efforts,", + "start": 74.96, + "end": 75.22, + "confidence": 0.108 + }, + { + "text": "elles", + "start": 75.22, + "end": 75.32, + "confidence": 0.108 + }, + { + "text": "aident", + "start": 75.32, + "end": 75.44, + "confidence": 0.289 + }, + { + "text": "dépendant", + "start": 75.44, + "end": 76.0, + "confidence": 0.576 + }, + { + "text": "de", + "start": 76.0, + "end": 76.16, + "confidence": 0.301 + }, + { + "text": "cette", + "start": 76.16, + "end": 76.2, + "confidence": 0.519 + }, + { + "text": "objet", + "start": 76.2, + "end": 76.48, + 
"confidence": 0.961 + }, + { + "text": "d'un", + "start": 76.48, + "end": 76.86, + "confidence": 0.883 + }, + { + "text": "lieu,", + "start": 76.86, + "end": 77.06, + "confidence": 0.333 + }, + { + "text": "en", + "start": 77.06, + "end": 77.18, + "confidence": 0.837 + }, + { + "text": "fait,", + "start": 77.18, + "end": 77.42, + "confidence": 0.958 + }, + { + "text": "une", + "start": 77.42, + "end": 77.46, + "confidence": 0.57 + }, + { + "text": "espèce", + "start": 77.46, + "end": 77.74, + "confidence": 0.961 + }, + { + "text": "de", + "start": 77.74, + "end": 77.93, + "confidence": 0.601 + } + ] + }, + { + "id": 23, + "seek": 5548, + "start": 77.93, + "end": 82.98, + "text": " relation de médiation avec le monde qui rendent un peu avec la même sédiforme de", + "tokens": [ + 9721, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 317, + 517, + 5604, + 4163, + 635, + 5698, + 262, + 7811, + 8629, + 68, + 368 + ], + "temperature": 0.0, + "avg_logprob": -0.6093524909167556, + "compression_ratio": 1.6292834890965733, + "no_speech_prob": 6.752492481609806e-05, + "confidence": 0.556, + "words": [ + { + "text": "relation", + "start": 77.93, + "end": 78.32, + "confidence": 0.839 + }, + { + "text": "de", + "start": 78.32, + "end": 78.7, + "confidence": 0.723 + }, + { + "text": "médiation", + "start": 78.7, + "end": 79.4, + "confidence": 0.872 + }, + { + "text": "avec", + "start": 79.4, + "end": 79.74, + "confidence": 0.964 + }, + { + "text": "le", + "start": 79.74, + "end": 79.88, + "confidence": 0.985 + }, + { + "text": "monde", + "start": 79.88, + "end": 80.24, + "confidence": 0.909 + }, + { + "text": "qui", + "start": 80.24, + "end": 81.02, + "confidence": 0.871 + }, + { + "text": "rendent", + "start": 81.02, + "end": 81.74, + "confidence": 0.623 + }, + { + "text": "un", + "start": 81.74, + "end": 81.84, + "confidence": 0.224 + }, + { + "text": "peu", + "start": 81.84, + "end": 81.88, + "confidence": 0.223 + }, + { + "text": "avec", + "start": 81.88, + 
"end": 82.1, + "confidence": 0.863 + }, + { + "text": "la", + "start": 82.1, + "end": 82.24, + "confidence": 0.565 + }, + { + "text": "même", + "start": 82.24, + "end": 82.32, + "confidence": 0.384 + }, + { + "text": "sédiforme", + "start": 82.32, + "end": 82.86, + "confidence": 0.29 + }, + { + "text": "de", + "start": 82.86, + "end": 82.98, + "confidence": 0.899 + } + ] + }, + { + "id": 24, + "seek": 8298, + "start": 83.0, + "end": 87.66, + "text": " le jeu. Donc, à objets inédits, rapport inédits.", + "tokens": [ + 476, + 16748, + 13, + 7477, + 11, + 1531, + 1111, + 25349, + 294, + 7811, + 1208, + 11, + 18018, + 294, + 7811, + 1208, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.614, + "words": [ + { + "text": "le", + "start": 83.0, + "end": 83.12, + "confidence": 0.128 + }, + { + "text": "jeu.", + "start": 83.12, + "end": 83.64, + "confidence": 0.505 + }, + { + "text": "Donc,", + "start": 83.64, + "end": 84.48, + "confidence": 0.513 + }, + { + "text": "à", + "start": 84.48, + "end": 84.86, + "confidence": 0.634 + }, + { + "text": "objets", + "start": 84.86, + "end": 85.36, + "confidence": 0.547 + }, + { + "text": "inédits,", + "start": 85.36, + "end": 86.24, + "confidence": 0.73 + }, + { + "text": "rapport", + "start": 86.24, + "end": 86.62, + "confidence": 0.928 + }, + { + "text": "inédits.", + "start": 86.62, + "end": 87.66, + "confidence": 0.921 + } + ] + }, + { + "id": 25, + "seek": 8298, + "start": 88.08, + "end": 93.78, + "text": " Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépenses", + "tokens": [ + 3790, + 11, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 46750, + 38268, + 11, + 431, + 4212, + 1032, + 578, + 4198, + 50027, + 971, + 517, + 41953, + 933, + 368, + 27998, + 9085 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + 
"no_speech_prob": 3.121094050584361e-05, + "confidence": 0.624, + "words": [ + { + "text": "Et,", + "start": 88.08, + "end": 88.3, + "confidence": 0.87 + }, + { + "text": "ce", + "start": 88.3, + "end": 88.8, + "confidence": 0.462 + }, + { + "text": "rapport,", + "start": 88.8, + "end": 89.28, + "confidence": 0.997 + }, + { + "text": "si", + "start": 89.28, + "end": 89.56, + "confidence": 0.913 + }, + { + "text": "j'en", + "start": 89.56, + "end": 89.74, + "confidence": 0.771 + }, + { + "text": "prends", + "start": 89.74, + "end": 89.84, + "confidence": 0.313 + }, + { + "text": "Nicolas,", + "start": 89.84, + "end": 90.54, + "confidence": 0.358 + }, + { + "text": "frère", + "start": 90.54, + "end": 91.06, + "confidence": 0.405 + }, + { + "text": "caractérisée", + "start": 91.06, + "end": 91.7, + "confidence": 0.567 + }, + { + "text": "par", + "start": 91.7, + "end": 92.12, + "confidence": 0.868 + }, + { + "text": "un", + "start": 92.12, + "end": 92.32, + "confidence": 0.989 + }, + { + "text": "mélange", + "start": 92.32, + "end": 92.96, + "confidence": 0.932 + }, + { + "text": "de", + "start": 92.96, + "end": 93.24, + "confidence": 0.812 + }, + { + "text": "dépenses", + "start": 93.24, + "end": 93.78, + "confidence": 0.404 + } + ] + }, + { + "id": 26, + "seek": 8298, + "start": 94.36, + "end": 94.98, + "text": " et de rojets.", + "tokens": [ + 1030, + 368, + 744, + 73, + 1385, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.583, + "words": [ + { + "text": "et", + "start": 94.36, + "end": 94.52, + "confidence": 0.986 + }, + { + "text": "de", + "start": 94.52, + "end": 94.56, + "confidence": 0.996 + }, + { + "text": "rojets.", + "start": 94.56, + "end": 94.98, + "confidence": 0.41 + } + ] + }, + { + "id": 27, + "seek": 8298, + "start": 95.8, + "end": 100.4, + "text": " Bon, en vrai, il faudrait remonter très très finement toute l'histoire des 
objectes", + "tokens": [ + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 5732, + 962, + 1712, + 14953, + 287, + 6, + 29093, + 730, + 2657, + 279 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.749, + "words": [ + { + "text": "Bon,", + "start": 95.8, + "end": 96.06, + "confidence": 0.71 + }, + { + "text": "en", + "start": 96.06, + "end": 96.54, + "confidence": 0.92 + }, + { + "text": "vrai,", + "start": 96.54, + "end": 96.88, + "confidence": 0.994 + }, + { + "text": "il", + "start": 96.88, + "end": 97.1, + "confidence": 0.985 + }, + { + "text": "faudrait", + "start": 97.1, + "end": 97.5, + "confidence": 0.932 + }, + { + "text": "remonter", + "start": 97.5, + "end": 98.02, + "confidence": 0.574 + }, + { + "text": "très", + "start": 98.02, + "end": 98.46, + "confidence": 0.984 + }, + { + "text": "très", + "start": 98.46, + "end": 98.76, + "confidence": 0.597 + }, + { + "text": "finement", + "start": 98.76, + "end": 99.36, + "confidence": 0.476 + }, + { + "text": "toute", + "start": 99.36, + "end": 99.68, + "confidence": 0.367 + }, + { + "text": "l'histoire", + "start": 99.68, + "end": 100.02, + "confidence": 0.909 + }, + { + "text": "des", + "start": 100.02, + "end": 100.2, + "confidence": 0.949 + }, + { + "text": "objectes", + "start": 100.2, + "end": 100.4, + "confidence": 0.805 + } + ] + }, + { + "id": 28, + "seek": 8298, + "start": 100.4, + "end": 105.14, + "text": " techniques et de leur infération dans le vie pour déterminer si ce rapport est totalement", + "tokens": [ + 7512, + 1030, + 368, + 9580, + 1536, + 526, + 2405, + 2680, + 476, + 4941, + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.665, + "words": [ + { + 
"text": "techniques", + "start": 100.4, + "end": 101.02, + "confidence": 0.954 + }, + { + "text": "et", + "start": 101.02, + "end": 101.52, + "confidence": 0.967 + }, + { + "text": "de", + "start": 101.52, + "end": 101.64, + "confidence": 0.973 + }, + { + "text": "leur", + "start": 101.64, + "end": 101.78, + "confidence": 0.811 + }, + { + "text": "infération", + "start": 101.78, + "end": 102.22, + "confidence": 0.227 + }, + { + "text": "dans", + "start": 102.22, + "end": 102.46, + "confidence": 0.518 + }, + { + "text": "le", + "start": 102.46, + "end": 102.54, + "confidence": 0.511 + }, + { + "text": "vie", + "start": 102.54, + "end": 102.78, + "confidence": 0.612 + }, + { + "text": "pour", + "start": 102.78, + "end": 103.06, + "confidence": 0.933 + }, + { + "text": "déterminer", + "start": 103.06, + "end": 103.64, + "confidence": 0.954 + }, + { + "text": "si", + "start": 103.64, + "end": 103.74, + "confidence": 0.488 + }, + { + "text": "ce", + "start": 103.74, + "end": 103.86, + "confidence": 0.98 + }, + { + "text": "rapport", + "start": 103.86, + "end": 104.1, + "confidence": 0.997 + }, + { + "text": "est", + "start": 104.1, + "end": 104.88, + "confidence": 0.942 + }, + { + "text": "totalement", + "start": 104.88, + "end": 105.14, + "confidence": 0.854 + } + ] + }, + { + "id": 29, + "seek": 8298, + "start": 105.26, + "end": 105.78, + "text": " inédit.", + "tokens": [ + 294, + 7811, + 270, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.943, + "words": [ + { + "text": "inédit.", + "start": 105.26, + "end": 105.78, + "confidence": 0.943 + } + ] + }, + { + "id": 30, + "seek": 8298, + "start": 106.14, + "end": 109.36, + "text": " Mais j'ai l'impression comme ça que Nicolas se trompe pas vraiment.", + "tokens": [ + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13 + 
], + "temperature": 0.0, + "avg_logprob": -0.4346100035167876, + "compression_ratio": 1.5907335907335907, + "no_speech_prob": 3.121094050584361e-05, + "confidence": 0.798, + "words": [ + { + "text": "Mais", + "start": 106.14, + "end": 106.34, + "confidence": 0.872 + }, + { + "text": "j'ai", + "start": 106.34, + "end": 106.9, + "confidence": 0.924 + }, + { + "text": "l'impression", + "start": 106.9, + "end": 107.28, + "confidence": 0.967 + }, + { + "text": "comme", + "start": 107.28, + "end": 107.5, + "confidence": 0.709 + }, + { + "text": "ça", + "start": 107.5, + "end": 107.68, + "confidence": 0.955 + }, + { + "text": "que", + "start": 107.68, + "end": 107.96, + "confidence": 0.91 + }, + { + "text": "Nicolas", + "start": 107.96, + "end": 108.36, + "confidence": 0.986 + }, + { + "text": "se", + "start": 108.36, + "end": 108.66, + "confidence": 0.569 + }, + { + "text": "trompe", + "start": 108.66, + "end": 109.0, + "confidence": 0.532 + }, + { + "text": "pas", + "start": 109.0, + "end": 109.1, + "confidence": 0.715 + }, + { + "text": "vraiment.", + "start": 109.1, + "end": 109.36, + "confidence": 0.923 + } + ] + }, + { + "id": 31, + "seek": 10970, + "start": 109.72, + "end": 114.26, + "text": " Pour autant, je sache. 
Il y a eu plein de discussions autour de la voiture ou même", + "tokens": [ + 8732, + 34081, + 11, + 1506, + 262, + 6000, + 13, + 4416, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.829, + "words": [ + { + "text": "Pour", + "start": 109.72, + "end": 110.08, + "confidence": 0.92 + }, + { + "text": "autant,", + "start": 110.08, + "end": 110.36, + "confidence": 0.986 + }, + { + "text": "je", + "start": 110.36, + "end": 110.4, + "confidence": 0.894 + }, + { + "text": "sache.", + "start": 110.4, + "end": 110.86, + "confidence": 0.531 + }, + { + "text": "Il", + "start": 110.86, + "end": 111.16, + "confidence": 0.851 + }, + { + "text": "y", + "start": 111.16, + "end": 111.22, + "confidence": 0.872 + }, + { + "text": "a", + "start": 111.22, + "end": 111.28, + "confidence": 0.939 + }, + { + "text": "eu", + "start": 111.28, + "end": 111.38, + "confidence": 0.891 + }, + { + "text": "plein", + "start": 111.38, + "end": 111.76, + "confidence": 0.833 + }, + { + "text": "de", + "start": 111.76, + "end": 112.04, + "confidence": 0.94 + }, + { + "text": "discussions", + "start": 112.04, + "end": 112.46, + "confidence": 0.711 + }, + { + "text": "autour", + "start": 112.46, + "end": 112.96, + "confidence": 0.97 + }, + { + "text": "de", + "start": 112.96, + "end": 113.46, + "confidence": 0.952 + }, + { + "text": "la", + "start": 113.46, + "end": 113.5, + "confidence": 0.955 + }, + { + "text": "voiture", + "start": 113.5, + "end": 113.8, + "confidence": 0.983 + }, + { + "text": "ou", + "start": 113.8, + "end": 114.02, + "confidence": 0.523 + }, + { + "text": "même", + "start": 114.02, + "end": 114.26, + "confidence": 0.963 + } + ] + }, + { + "id": 32, + "seek": 10970, + "start": 114.42, + "end": 118.76, + "text": " du téléphone. 
Mais la dépense n'était pas du même mort, donc le rejet n'en", + "tokens": [ + 1581, + 47159, + 13, + 6313, + 635, + 27998, + 1288, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 6599, + 11, + 5926, + 476, + 319, + 7108, + 297, + 6, + 268 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.732, + "words": [ + { + "text": "du", + "start": 114.42, + "end": 114.6, + "confidence": 0.677 + }, + { + "text": "téléphone.", + "start": 114.6, + "end": 115.16, + "confidence": 0.983 + }, + { + "text": "Mais", + "start": 115.16, + "end": 115.72, + "confidence": 0.649 + }, + { + "text": "la", + "start": 115.72, + "end": 116.0, + "confidence": 0.809 + }, + { + "text": "dépense", + "start": 116.0, + "end": 116.38, + "confidence": 0.766 + }, + { + "text": "n'était", + "start": 116.38, + "end": 116.62, + "confidence": 0.952 + }, + { + "text": "pas", + "start": 116.62, + "end": 117.02, + "confidence": 0.994 + }, + { + "text": "du", + "start": 117.02, + "end": 117.16, + "confidence": 0.98 + }, + { + "text": "même", + "start": 117.16, + "end": 117.32, + "confidence": 0.944 + }, + { + "text": "mort,", + "start": 117.32, + "end": 117.66, + "confidence": 0.519 + }, + { + "text": "donc", + "start": 117.66, + "end": 117.78, + "confidence": 0.871 + }, + { + "text": "le", + "start": 117.78, + "end": 118.32, + "confidence": 0.932 + }, + { + "text": "rejet", + "start": 118.32, + "end": 118.62, + "confidence": 0.524 + }, + { + "text": "n'en", + "start": 118.62, + "end": 118.76, + "confidence": 0.472 + } + ] + }, + { + "id": 33, + "seek": 10970, + "start": 118.76, + "end": 119.66, + "text": " plus n'était pas du même mort.", + "tokens": [ + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 6599, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.853, + "words": 
[ + { + "text": "plus", + "start": 118.76, + "end": 118.9, + "confidence": 0.313 + }, + { + "text": "n'était", + "start": 118.9, + "end": 119.1, + "confidence": 0.973 + }, + { + "text": "pas", + "start": 119.1, + "end": 119.26, + "confidence": 0.998 + }, + { + "text": "du", + "start": 119.26, + "end": 119.36, + "confidence": 0.988 + }, + { + "text": "même", + "start": 119.36, + "end": 119.5, + "confidence": 0.999 + }, + { + "text": "mort.", + "start": 119.5, + "end": 119.66, + "confidence": 0.984 + } + ] + }, + { + "id": 34, + "seek": 10970, + "start": 120.06, + "end": 122.94, + "text": " On peut adorer sa bagnure, en avoir besoin pour plein de choses.", + "tokens": [ + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 77, + 540, + 11, + 465, + 10853, + 19207, + 2016, + 21088, + 368, + 14488, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.753, + "words": [ + { + "text": "On", + "start": 120.06, + "end": 120.22, + "confidence": 0.969 + }, + { + "text": "peut", + "start": 120.22, + "end": 120.32, + "confidence": 0.988 + }, + { + "text": "adorer", + "start": 120.32, + "end": 120.64, + "confidence": 0.854 + }, + { + "text": "sa", + "start": 120.64, + "end": 120.86, + "confidence": 0.918 + }, + { + "text": "bagnure,", + "start": 120.86, + "end": 121.38, + "confidence": 0.368 + }, + { + "text": "en", + "start": 121.38, + "end": 121.52, + "confidence": 0.56 + }, + { + "text": "avoir", + "start": 121.52, + "end": 121.66, + "confidence": 0.969 + }, + { + "text": "besoin", + "start": 121.66, + "end": 122.08, + "confidence": 0.997 + }, + { + "text": "pour", + "start": 122.08, + "end": 122.34, + "confidence": 0.92 + }, + { + "text": "plein", + "start": 122.34, + "end": 122.64, + "confidence": 0.9 + }, + { + "text": "de", + "start": 122.64, + "end": 122.78, + "confidence": 0.993 + }, + { + "text": "choses.", + "start": 122.78, + "end": 122.94, + 
"confidence": 0.994 + } + ] + }, + { + "id": 35, + "seek": 10970, + "start": 123.36, + "end": 126.38, + "text": " Et là, le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 3790, + 3684, + 11, + 476, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.826, + "words": [ + { + "text": "Et", + "start": 123.36, + "end": 123.48, + "confidence": 0.557 + }, + { + "text": "là,", + "start": 123.48, + "end": 123.66, + "confidence": 0.527 + }, + { + "text": "le", + "start": 123.66, + "end": 124.02, + "confidence": 0.986 + }, + { + "text": "soir,", + "start": 124.02, + "end": 124.5, + "confidence": 0.966 + }, + { + "text": "quand", + "start": 124.5, + "end": 124.9, + "confidence": 0.774 + }, + { + "text": "on", + "start": 124.9, + "end": 125.02, + "confidence": 0.986 + }, + { + "text": "va", + "start": 125.02, + "end": 125.1, + "confidence": 0.968 + }, + { + "text": "se", + "start": 125.1, + "end": 125.2, + "confidence": 0.862 + }, + { + "text": "coucher,", + "start": 125.2, + "end": 125.64, + "confidence": 0.791 + }, + { + "text": "on", + "start": 125.64, + "end": 126.04, + "confidence": 0.974 + }, + { + "text": "la", + "start": 126.04, + "end": 126.12, + "confidence": 0.783 + }, + { + "text": "laisse.", + "start": 126.12, + "end": 126.38, + "confidence": 0.981 + } + ] + }, + { + "id": 36, + "seek": 10970, + "start": 127.06, + "end": 130.0, + "text": " On l'a pas dans la main, quand on est collis, quand on n'en mène pas au chiot.", + "tokens": [ + 1282, + 287, + 6, + 64, + 1736, + 2680, + 635, + 2135, + 11, + 6932, + 322, + 871, + 1263, + 271, + 11, + 6932, + 322, + 297, + 6, + 268, + 275, + 18832, + 1736, + 1609, + 417, + 6471, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + 
"no_speech_prob": 9.048193533089943e-06, + "confidence": 0.66, + "words": [ + { + "text": "On", + "start": 127.06, + "end": 127.3, + "confidence": 0.742 + }, + { + "text": "l'a", + "start": 127.3, + "end": 127.46, + "confidence": 0.714 + }, + { + "text": "pas", + "start": 127.46, + "end": 127.64, + "confidence": 0.99 + }, + { + "text": "dans", + "start": 127.64, + "end": 127.82, + "confidence": 0.967 + }, + { + "text": "la", + "start": 127.82, + "end": 127.94, + "confidence": 0.956 + }, + { + "text": "main,", + "start": 127.94, + "end": 128.3, + "confidence": 0.978 + }, + { + "text": "quand", + "start": 128.3, + "end": 128.44, + "confidence": 0.967 + }, + { + "text": "on", + "start": 128.44, + "end": 128.6, + "confidence": 0.993 + }, + { + "text": "est", + "start": 128.6, + "end": 128.66, + "confidence": 0.602 + }, + { + "text": "collis,", + "start": 128.66, + "end": 129.2, + "confidence": 0.346 + }, + { + "text": "quand", + "start": 129.2, + "end": 129.24, + "confidence": 0.524 + }, + { + "text": "on", + "start": 129.24, + "end": 129.32, + "confidence": 0.991 + }, + { + "text": "n'en", + "start": 129.32, + "end": 129.38, + "confidence": 0.537 + }, + { + "text": "mène", + "start": 129.38, + "end": 129.56, + "confidence": 0.434 + }, + { + "text": "pas", + "start": 129.56, + "end": 129.72, + "confidence": 0.998 + }, + { + "text": "au", + "start": 129.72, + "end": 129.82, + "confidence": 0.811 + }, + { + "text": "chiot.", + "start": 129.82, + "end": 130.0, + "confidence": 0.473 + } + ] + }, + { + "id": 37, + "seek": 10970, + "start": 130.88, + "end": 135.1, + "text": " On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une", + "tokens": [ + 1282, + 45913, + 7418, + 1136, + 936, + 15797, + 971, + 1872, + 275, + 423, + 1956, + 2678, + 84, + 494, + 1001, + 635, + 34207, + 368, + 47159, + 17338, + 2251 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 
9.048193533089943e-06, + "confidence": 0.672, + "words": [ + { + "text": "On", + "start": 130.88, + "end": 131.0, + "confidence": 0.991 + }, + { + "text": "pouvait", + "start": 131.0, + "end": 131.24, + "confidence": 0.532 + }, + { + "text": "être", + "start": 131.24, + "end": 131.7, + "confidence": 0.545 + }, + { + "text": "émervé", + "start": 131.7, + "end": 132.2, + "confidence": 0.725 + }, + { + "text": "par", + "start": 132.2, + "end": 132.42, + "confidence": 0.82 + }, + { + "text": "son", + "start": 132.42, + "end": 132.68, + "confidence": 0.448 + }, + { + "text": "mome", + "start": 132.68, + "end": 133.04, + "confidence": 0.261 + }, + { + "text": "qui", + "start": 133.04, + "end": 133.26, + "confidence": 0.901 + }, + { + "text": "occupeait", + "start": 133.26, + "end": 133.72, + "confidence": 0.641 + }, + { + "text": "la", + "start": 133.72, + "end": 133.8, + "confidence": 0.8 + }, + { + "text": "ligne", + "start": 133.8, + "end": 134.0, + "confidence": 0.976 + }, + { + "text": "de", + "start": 134.0, + "end": 134.14, + "confidence": 0.964 + }, + { + "text": "téléphone", + "start": 134.14, + "end": 134.44, + "confidence": 0.977 + }, + { + "text": "pendant", + "start": 134.44, + "end": 134.8, + "confidence": 0.92 + }, + { + "text": "une", + "start": 134.8, + "end": 135.1, + "confidence": 0.838 + } + ] + }, + { + "id": 38, + "seek": 10970, + "start": 135.1, + "end": 136.84, + "text": " heure chaque soir pour discuter avec un copain.", + "tokens": [ + 30027, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.394765736144266, + "compression_ratio": 1.7249190938511327, + "no_speech_prob": 9.048193533089943e-06, + "confidence": 0.922, + "words": [ + { + "text": "heure", + "start": 135.1, + "end": 135.36, + "confidence": 0.701 + }, + { + "text": "chaque", + "start": 135.36, + "end": 135.52, + "confidence": 0.957 + }, + { + "text": "soir", + "start": 135.52, + "end": 135.76, + "confidence": 
0.997 + }, + { + "text": "pour", + "start": 135.76, + "end": 135.94, + "confidence": 0.983 + }, + { + "text": "discuter", + "start": 135.94, + "end": 136.26, + "confidence": 0.882 + }, + { + "text": "avec", + "start": 136.26, + "end": 136.44, + "confidence": 0.993 + }, + { + "text": "un", + "start": 136.44, + "end": 136.6, + "confidence": 0.976 + }, + { + "text": "copain.", + "start": 136.6, + "end": 136.84, + "confidence": 0.948 + } + ] + }, + { + "id": 39, + "seek": 13702, + "start": 137.26, + "end": 141.8, + "text": " Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui", + "tokens": [ + 6313, + 2788, + 408, + 725, + 37227, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 5698, + 275, + 423, + 14023, + 6, + 10556 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.716, + "words": [ + { + "text": "Mais", + "start": 137.26, + "end": 137.52, + "confidence": 0.967 + }, + { + "text": "ça", + "start": 137.52, + "end": 137.6, + "confidence": 0.859 + }, + { + "text": "ne", + "start": 137.6, + "end": 137.68, + "confidence": 0.681 + }, + { + "text": "ressemble", + "start": 137.68, + "end": 138.14, + "confidence": 0.743 + }, + { + "text": "pas", + "start": 138.14, + "end": 138.66, + "confidence": 0.524 + }, + { + "text": "à", + "start": 138.66, + "end": 138.94, + "confidence": 0.978 + }, + { + "text": "ce", + "start": 138.94, + "end": 139.02, + "confidence": 0.605 + }, + { + "text": "qu'on", + "start": 139.02, + "end": 139.16, + "confidence": 0.961 + }, + { + "text": "peut", + "start": 139.16, + "end": 139.3, + "confidence": 0.586 + }, + { + "text": "ressentir", + "start": 139.3, + "end": 140.04, + "confidence": 0.898 + }, + { + "text": "à", + "start": 140.04, + "end": 140.24, + "confidence": 0.352 + }, + { + "text": "voir", + "start": 140.24, + "end": 140.48, + "confidence": 0.918 + }, 
+ { + "text": "même", + "start": 140.48, + "end": 140.86, + "confidence": 0.324 + }, + { + "text": "mome", + "start": 140.86, + "end": 141.18, + "confidence": 0.374 + }, + { + "text": "aujourd'hui", + "start": 141.18, + "end": 141.8, + "confidence": 0.949 + } + ] + }, + { + "id": 40, + "seek": 13702, + "start": 141.92, + "end": 145.76, + "text": " continuuellement avec son smartphone dans la main, comme c'était une sorte de estimateur", + "tokens": [ + 2993, + 31816, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 5173, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 8017, + 15540 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.584, + "words": [ + { + "text": "continuuellement", + "start": 141.92, + "end": 142.8, + "confidence": 0.327 + }, + { + "text": "avec", + "start": 142.8, + "end": 143.18, + "confidence": 0.903 + }, + { + "text": "son", + "start": 143.18, + "end": 143.36, + "confidence": 0.866 + }, + { + "text": "smartphone", + "start": 143.36, + "end": 143.64, + "confidence": 0.467 + }, + { + "text": "dans", + "start": 143.64, + "end": 143.92, + "confidence": 0.554 + }, + { + "text": "la", + "start": 143.92, + "end": 144.0, + "confidence": 0.972 + }, + { + "text": "main,", + "start": 144.0, + "end": 144.26, + "confidence": 0.997 + }, + { + "text": "comme", + "start": 144.26, + "end": 144.52, + "confidence": 0.95 + }, + { + "text": "c'était", + "start": 144.52, + "end": 144.78, + "confidence": 0.574 + }, + { + "text": "une", + "start": 144.78, + "end": 144.94, + "confidence": 0.971 + }, + { + "text": "sorte", + "start": 144.94, + "end": 145.1, + "confidence": 0.642 + }, + { + "text": "de", + "start": 145.1, + "end": 145.18, + "confidence": 0.268 + }, + { + "text": "estimateur", + "start": 145.18, + "end": 145.76, + "confidence": 0.415 + } + ] + }, + { + "id": 41, + "seek": 13702, + "start": 145.94, + "end": 148.88, + "text": " extère 
de l'intempis de lâcher à l'éantrénée, ça m'a eu immédiate.", + "tokens": [ + 1279, + 4212, + 368, + 287, + 6, + 686, + 15970, + 271, + 368, + 48835, + 6759, + 1531, + 287, + 6, + 526, + 394, + 81, + 3516, + 3856, + 11, + 2788, + 275, + 6, + 64, + 2228, + 3397, + 526, + 4504, + 473, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.401, + "words": [ + { + "text": "extère", + "start": 145.94, + "end": 146.38, + "confidence": 0.357 + }, + { + "text": "de", + "start": 146.38, + "end": 146.46, + "confidence": 0.253 + }, + { + "text": "l'intempis", + "start": 146.46, + "end": 146.7, + "confidence": 0.153 + }, + { + "text": "de", + "start": 146.7, + "end": 146.9, + "confidence": 0.858 + }, + { + "text": "lâcher", + "start": 146.9, + "end": 147.32, + "confidence": 0.824 + }, + { + "text": "à", + "start": 147.32, + "end": 147.44, + "confidence": 0.494 + }, + { + "text": "l'éantrénée,", + "start": 147.44, + "end": 147.94, + "confidence": 0.476 + }, + { + "text": "ça", + "start": 147.94, + "end": 148.0, + "confidence": 0.772 + }, + { + "text": "m'a", + "start": 148.0, + "end": 148.26, + "confidence": 0.532 + }, + { + "text": "eu", + "start": 148.26, + "end": 148.42, + "confidence": 0.181 + }, + { + "text": "immédiate.", + "start": 148.42, + "end": 148.88, + "confidence": 0.537 + } + ] + }, + { + "id": 42, + "seek": 13702, + "start": 149.08, + "end": 152.02, + "text": " Bon, je dis ça pour le mome, mais évidemment, va là pour nos aussi.", + "tokens": [ + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 423, + 11, + 2420, + 24724, + 11, + 2773, + 3684, + 2016, + 3269, + 6212, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.529, + "words": [ + { + "text": "Bon,", + "start": 149.08, + "end": 149.3, + "confidence": 0.285 + 
}, + { + "text": "je", + "start": 149.3, + "end": 149.34, + "confidence": 0.425 + }, + { + "text": "dis", + "start": 149.34, + "end": 149.42, + "confidence": 0.316 + }, + { + "text": "ça", + "start": 149.42, + "end": 149.62, + "confidence": 0.953 + }, + { + "text": "pour", + "start": 149.62, + "end": 149.72, + "confidence": 0.971 + }, + { + "text": "le", + "start": 149.72, + "end": 149.82, + "confidence": 0.993 + }, + { + "text": "mome,", + "start": 149.82, + "end": 150.24, + "confidence": 0.575 + }, + { + "text": "mais", + "start": 150.24, + "end": 150.44, + "confidence": 0.713 + }, + { + "text": "évidemment,", + "start": 150.44, + "end": 151.1, + "confidence": 0.775 + }, + { + "text": "va", + "start": 151.1, + "end": 151.28, + "confidence": 0.381 + }, + { + "text": "là", + "start": 151.28, + "end": 151.42, + "confidence": 0.633 + }, + { + "text": "pour", + "start": 151.42, + "end": 151.62, + "confidence": 0.398 + }, + { + "text": "nos", + "start": 151.62, + "end": 151.7, + "confidence": 0.807 + }, + { + "text": "aussi.", + "start": 151.7, + "end": 152.02, + "confidence": 0.145 + } + ] + }, + { + "id": 43, + "seek": 13702, + "start": 152.66, + "end": 154.4, + "text": " Donc, rapport immédiate d'accord.", + "tokens": [ + 7477, + 11, + 18018, + 3397, + 526, + 4504, + 473, + 274, + 6, + 19947, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.851, + "words": [ + { + "text": "Donc,", + "start": 152.66, + "end": 153.0, + "confidence": 0.985 + }, + { + "text": "rapport", + "start": 153.0, + "end": 153.42, + "confidence": 0.977 + }, + { + "text": "immédiate", + "start": 153.42, + "end": 154.26, + "confidence": 0.825 + }, + { + "text": "d'accord.", + "start": 154.26, + "end": 154.4, + "confidence": 0.806 + } + ] + }, + { + "id": 44, + "seek": 13702, + "start": 154.4, + "end": 157.95, + "text": " Mais pourquoi, à ton impression qu'on en sortira 
jamais?", + "tokens": [ + 6313, + 19934, + 11, + 1531, + 2952, + 9995, + 421, + 6, + 266, + 465, + 26906, + 64, + 14540, + 30 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.791, + "words": [ + { + "text": "Mais", + "start": 154.4, + "end": 155.9, + "confidence": 0.984 + }, + { + "text": "pourquoi,", + "start": 155.9, + "end": 156.36, + "confidence": 0.959 + }, + { + "text": "à", + "start": 156.36, + "end": 156.48, + "confidence": 0.821 + }, + { + "text": "ton", + "start": 156.48, + "end": 156.66, + "confidence": 0.952 + }, + { + "text": "impression", + "start": 156.66, + "end": 156.96, + "confidence": 0.932 + }, + { + "text": "qu'on", + "start": 156.96, + "end": 157.28, + "confidence": 0.906 + }, + { + "text": "en", + "start": 157.28, + "end": 157.34, + "confidence": 0.789 + }, + { + "text": "sortira", + "start": 157.34, + "end": 157.84, + "confidence": 0.543 + }, + { + "text": "jamais?", + "start": 157.84, + "end": 157.95, + "confidence": 0.503 + } + ] + }, + { + "id": 45, + "seek": 13702, + "start": 157.95, + "end": 162.37, + "text": " Et puis, il faut en remettre la faute sur les gens qui ont créé cette", + "tokens": [ + 3790, + 9093, + 11, + 1930, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 5550 + ], + "temperature": 0.0, + "avg_logprob": -0.5734858703613281, + "compression_ratio": 1.5562700964630225, + "no_speech_prob": 3.1260256037057843e-06, + "confidence": 0.82, + "words": [ + { + "text": "Et", + "start": 157.95, + "end": 159.26, + "confidence": 0.838 + }, + { + "text": "puis,", + "start": 159.26, + "end": 159.58, + "confidence": 0.481 + }, + { + "text": "il", + "start": 159.58, + "end": 159.62, + "confidence": 0.665 + }, + { + "text": "faut", + "start": 159.62, + "end": 159.66, + "confidence": 0.942 + }, + { + "text": "en", + "start": 159.66, + "end": 159.72, + 
"confidence": 0.925 + }, + { + "text": "remettre", + "start": 159.72, + "end": 160.1, + "confidence": 0.985 + }, + { + "text": "la", + "start": 160.1, + "end": 160.28, + "confidence": 0.702 + }, + { + "text": "faute", + "start": 160.28, + "end": 160.62, + "confidence": 0.55 + }, + { + "text": "sur", + "start": 160.62, + "end": 160.9, + "confidence": 0.954 + }, + { + "text": "les", + "start": 160.9, + "end": 161.22, + "confidence": 0.81 + }, + { + "text": "gens", + "start": 161.22, + "end": 161.42, + "confidence": 0.985 + }, + { + "text": "qui", + "start": 161.42, + "end": 161.58, + "confidence": 0.981 + }, + { + "text": "ont", + "start": 161.58, + "end": 161.62, + "confidence": 0.955 + }, + { + "text": "créé", + "start": 161.62, + "end": 162.3, + "confidence": 0.957 + }, + { + "text": "cette", + "start": 162.3, + "end": 162.37, + "confidence": 0.9 + } + ] + }, + { + "id": 46, + "seek": 16228, + "start": 162.37, + "end": 165.3, + "text": " route merveilleux et diabolique, qui a dit à bollique par coeur, merveilleux.", + "tokens": [ + 7955, + 3551, + 303, + 3409, + 2449, + 1030, + 33227, + 401, + 1925, + 11, + 1956, + 257, + 6176, + 1531, + 748, + 285, + 1925, + 971, + 45781, + 11, + 3551, + 303, + 3409, + 2449, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7643054464588994, + "compression_ratio": 1.544041450777202, + "no_speech_prob": 3.89045562769752e-05, + "confidence": 0.397, + "words": [ + { + "text": "route", + "start": 162.37, + "end": 162.6, + "confidence": 0.076 + }, + { + "text": "merveilleux", + "start": 162.6, + "end": 163.3, + "confidence": 0.635 + }, + { + "text": "et", + "start": 163.3, + "end": 163.42, + "confidence": 0.837 + }, + { + "text": "diabolique,", + "start": 163.42, + "end": 163.82, + "confidence": 0.328 + }, + { + "text": "qui", + "start": 163.82, + "end": 163.9, + "confidence": 0.365 + }, + { + "text": "a", + "start": 163.9, + "end": 163.98, + "confidence": 0.054 + }, + { + "text": "dit", + "start": 163.98, + "end": 164.06, + 
"confidence": 0.085 + }, + { + "text": "à", + "start": 164.06, + "end": 164.1, + "confidence": 0.433 + }, + { + "text": "bollique", + "start": 164.1, + "end": 164.3, + "confidence": 0.297 + }, + { + "text": "par", + "start": 164.3, + "end": 164.52, + "confidence": 0.634 + }, + { + "text": "coeur,", + "start": 164.52, + "end": 164.78, + "confidence": 0.361 + }, + { + "text": "merveilleux.", + "start": 164.78, + "end": 165.3, + "confidence": 0.982 + } + ] + }, + { + "id": 47, + "seek": 16228, + "start": 167.36, + "end": 168.7, + "text": " Les économistes parlent de dépendance du santé.", + "tokens": [ + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 30068, + 13 + ], + "temperature": 0.0, + "avg_logprob": -0.7643054464588994, + "compression_ratio": 1.544041450777202, + "no_speech_prob": 3.89045562769752e-05, + "confidence": 0.748, + "words": [ + { + "text": "Les", + "start": 167.36, + "end": 167.4, + "confidence": 0.513 + }, + { + "text": "économistes", + "start": 167.4, + "end": 167.5, + "confidence": 0.937 + }, + { + "text": "parlent", + "start": 167.5, + "end": 167.78, + "confidence": 0.806 + }, + { + "text": "de", + "start": 167.78, + "end": 167.82, + "confidence": 0.855 + }, + { + "text": "dépendance", + "start": 167.82, + "end": 168.32, + "confidence": 0.758 + }, + { + "text": "du", + "start": 168.32, + "end": 168.5, + "confidence": 0.979 + }, + { + "text": "santé.", + "start": 168.5, + "end": 168.7, + "confidence": 0.389 + } + ] + }, + { + "id": 48, + "seek": 16228, + "start": 168.84, + "end": 172.66, + "text": " Ces vidéos, en fait, on est un santé qui a été établie, c'est un soit mon termine,", + "tokens": [ + 28414, + 25417, + 11, + 465, + 3887, + 11, + 322, + 871, + 517, + 30068, + 1956, + 257, + 8862, + 4823, + 455, + 6302, + 11, + 269, + 6, + 377, + 517, + 12703, + 1108, + 1433, + 533, + 11 + ], + "temperature": 0.0, + "avg_logprob": -0.7643054464588994, + "compression_ratio": 1.544041450777202, + "no_speech_prob": 
3.89045562769752e-05, + "confidence": 0.487, + "words": [ + { + "text": "Ces", + "start": 168.84, + "end": 169.14, + "confidence": 0.531 + }, + { + "text": "vidéos,", + "start": 169.14, + "end": 169.5, + "confidence": 0.725 + }, + { + "text": "en", + "start": 169.5, + "end": 169.62, + "confidence": 0.757 + }, + { + "text": "fait,", + "start": 169.62, + "end": 169.68, + "confidence": 0.974 + }, + { + "text": "on", + "start": 169.68, + "end": 169.74, + "confidence": 0.306 + }, + { + "text": "est", + "start": 169.74, + "end": 169.86, + "confidence": 0.82 + }, + { + "text": "un", + "start": 169.86, + "end": 170.16, + "confidence": 0.245 + }, + { + "text": "santé", + "start": 170.16, + "end": 170.72, + "confidence": 0.943 + }, + { + "text": "qui", + "start": 170.72, + "end": 170.88, + "confidence": 0.839 + }, + { + "text": "a", + "start": 170.88, + "end": 170.96, + "confidence": 0.533 + }, + { + "text": "été", + "start": 170.96, + "end": 171.08, + "confidence": 0.992 + }, + { + "text": "établie,", + "start": 171.08, + "end": 171.6, + "confidence": 0.316 + }, + { + "text": "c'est", + "start": 171.6, + "end": 171.74, + "confidence": 0.55 + }, + { + "text": "un", + "start": 171.74, + "end": 171.88, + "confidence": 0.651 + }, + { + "text": "soit", + "start": 171.88, + "end": 172.12, + "confidence": 0.284 + }, + { + "text": "mon", + "start": 172.12, + "end": 172.28, + "confidence": 0.225 + }, + { + "text": "termine,", + "start": 172.28, + "end": 172.66, + "confidence": 0.288 + } + ] + }, + { + "id": 49, + "seek": 17312, + "start": 173.14, + "end": 177.42, + "text": " soit définissant des beurs, on définisse un signalétique.", + "tokens": [ + 50364, + 12703, + 40763, + 29492, + 730, + 312, + 2156, + 11, + 322, + 40763, + 7746, + 517, + 6358, + 42379, + 13, + 51436 + ], + "temperature": 0.0, + "avg_logprob": -0.9428024291992188, + "compression_ratio": 1.0169491525423728, + "no_speech_prob": 6.687085260637105e-05, + "confidence": 0.403, + "words": [ + { + "text": "soit", + 
"start": 173.14, + "end": 174.04, + "confidence": 0.127 + }, + { + "text": "définissant", + "start": 174.04, + "end": 175.5, + "confidence": 0.58 + }, + { + "text": "des", + "start": 175.5, + "end": 175.68, + "confidence": 0.813 + }, + { + "text": "beurs,", + "start": 175.68, + "end": 175.96, + "confidence": 0.378 + }, + { + "text": "on", + "start": 175.96, + "end": 176.04, + "confidence": 0.165 + }, + { + "text": "définisse", + "start": 176.04, + "end": 176.42, + "confidence": 0.536 + }, + { + "text": "un", + "start": 176.42, + "end": 176.6, + "confidence": 0.266 + }, + { + "text": "signalétique.", + "start": 176.6, + "end": 177.42, + "confidence": 0.544 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/bonjour.wav.words.json b/tests/expected/tiny_fr/bonjour.wav.words.json new file mode 100644 index 0000000000000000000000000000000000000000..6d1d63b947661bb29dbb3d480d85dc90a4e6c115 --- /dev/null +++ b/tests/expected/tiny_fr/bonjour.wav.words.json @@ -0,0 +1,32 @@ +{ + "text": " Bonjour !", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.14, + "end": 0.96, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50414 + ], + "temperature": 0.0, + "avg_logprob": -0.6977285861968994, + "compression_ratio": 0.5294117647058824, + "no_speech_prob": 0.019094161689281464, + "confidence": 0.829, + "words": [ + { + "text": "Bonjour !", + "start": 0.14, + "end": 0.96, + "confidence": 0.829 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/bonjour_vous_allez_bien.mp3.words.json b/tests/expected/tiny_fr/bonjour_vous_allez_bien.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..56d4282f71080f7d429dd75ef057267e85842e42 --- /dev/null +++ b/tests/expected/tiny_fr/bonjour_vous_allez_bien.mp3.words.json @@ -0,0 +1,162 @@ +{ + "text": " Bonjour ! Est-ce que vous allez bien ? Bonjour ! 
Esque vous allez bien !", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.44, + "end": 1.44, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50438 + ], + "temperature": 0.0, + "avg_logprob": -0.7721260706583659, + "compression_ratio": 0.8260869565217391, + "no_speech_prob": 0.04302893579006195, + "confidence": 0.688, + "words": [ + { + "text": "Bonjour !", + "start": 0.44, + "end": 1.44, + "confidence": 0.688 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 1.88, + "end": 3.12, + "text": " Est-ce que vous allez bien ?", + "tokens": [ + 50438, + 4410, + 12, + 384, + 631, + 2630, + 18146, + 3610, + 2506, + 50538 + ], + "temperature": 0.0, + "avg_logprob": -0.7721260706583659, + "compression_ratio": 0.8260869565217391, + "no_speech_prob": 0.04302893579006195, + "confidence": 0.68, + "words": [ + { + "text": "Est-ce", + "start": 1.88, + "end": 2.2, + "confidence": 0.667 + }, + { + "text": "que", + "start": 2.2, + "end": 2.24, + "confidence": 0.873 + }, + { + "text": "vous", + "start": 2.24, + "end": 2.36, + "confidence": 0.993 + }, + { + "text": "allez", + "start": 2.36, + "end": 2.56, + "confidence": 0.268 + }, + { + "text": "bien ?", + "start": 2.56, + "end": 3.12, + "confidence": 0.973 + } + ] + }, + { + "id": 2, + "seek": 3000, + "start": 32.98, + "end": 33.48, + "text": " Bonjour !", + "tokens": [ + 50364, + 25431, + 2298, + 50514 + ], + "temperature": 0.0, + "avg_logprob": -0.9276708456186148, + "compression_ratio": 0.8048780487804879, + "no_speech_prob": 0.3543654680252075, + "confidence": 0.533, + "words": [ + { + "text": "Bonjour !", + "start": 32.98, + "end": 33.48, + "confidence": 0.533 + } + ] + }, + { + "id": 3, + "seek": 3000, + "start": 34.42, + "end": 35.48, + "text": " Esque vous allez bien !", + "tokens": [ + 50514, + 2313, + 1077, + 2630, + 18146, + 3610, + 2298, + 50614 + ], + "temperature": 0.0, + "avg_logprob": -0.9276708456186148, + "compression_ratio": 0.8048780487804879, + "no_speech_prob": 0.3543654680252075, + 
"confidence": 0.484, + "words": [ + { + "text": "Esque", + "start": 34.42, + "end": 34.76, + "confidence": 0.186 + }, + { + "text": "vous", + "start": 34.76, + "end": 34.9, + "confidence": 0.982 + }, + { + "text": "allez", + "start": 34.9, + "end": 35.08, + "confidence": 0.781 + }, + { + "text": "bien !", + "start": 35.08, + "end": 35.48, + "confidence": 0.998 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/empty.mp3.words.json b/tests/expected/tiny_fr/empty.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..cd4c337f3962718881cc93300e57e4f7d05feedb --- /dev/null +++ b/tests/expected/tiny_fr/empty.mp3.words.json @@ -0,0 +1,5 @@ +{ + "text": "", + "segments": [], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/gaenswein15.mp3.words.json b/tests/expected/tiny_fr/gaenswein15.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..5bcf408187d102ee5d53ff99f31d8daa29e14bdc --- /dev/null +++ b/tests/expected/tiny_fr/gaenswein15.mp3.words.json @@ -0,0 +1,71 @@ +{ + "text": " Leur de l'Ontario est de la", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 20.14, + "end": 24.68, + "text": " Leur de l'Ontario est de la", + "tokens": [ + 50364, + 1456, + 374, + 368, + 287, + 6, + 46, + 580, + 4912, + 871, + 368, + 635, + 51571 + ], + "temperature": 0.0, + "avg_logprob": -1.7974119186401367, + "compression_ratio": 0.84375, + "no_speech_prob": 0.04553895816206932, + "confidence": 0.152, + "words": [ + { + "text": "Leur", + "start": 20.14, + "end": 20.16, + "confidence": 0.055 + }, + { + "text": "de", + "start": 20.16, + "end": 20.18, + "confidence": 0.11 + }, + { + "text": "l'Ontario", + "start": 20.18, + "end": 24.62, + "confidence": 0.309 + }, + { + "text": "est", + "start": 24.62, + "end": 24.64, + "confidence": 0.128 + }, + { + "text": "de", + "start": 24.64, + "end": 24.66, + "confidence": 0.063 + }, + { + "text": "la", 
+ "start": 24.66, + "end": 24.68, + "confidence": 0.133 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/gloria.mp3.words.json b/tests/expected/tiny_fr/gloria.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..5889dee1fb218b037b23960a5c1bf352861a0323 --- /dev/null +++ b/tests/expected/tiny_fr/gloria.mp3.words.json @@ -0,0 +1,1584 @@ +{ + "text": " Je suis très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 1.34, + "end": 29.98, + "text": " Je suis très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très 
très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très très", + "tokens": [ + 50364, + 2588, + 7624, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 
5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732, + 5732 + ], + "temperature": 0.0, + "avg_logprob": -0.3070239596896701, + "compression_ratio": 43.0, + "no_speech_prob": 0.11146047711372375, + "confidence": 0.734, + "words": [ + { + "text": "Je", + "start": 1.34, + "end": 5.76, + "confidence": 0.043 + }, + { + "text": "suis", + "start": 5.76, + "end": 5.92, + "confidence": 0.156 + }, + { + "text": "très", + "start": 5.92, + "end": 6.2, + "confidence": 0.053 + }, + { + "text": "très", + "start": 6.2, + "end": 10.56, + "confidence": 0.106 + }, + { + "text": "très", + "start": 10.56, + "end": 11.22, + "confidence": 0.159 + }, + { + "text": "très", + "start": 11.22, + "end": 11.34, + "confidence": 0.186 + }, + { + "text": "très", + "start": 11.34, + "end": 11.36, + "confidence": 0.201 + }, + { + "text": "très", + "start": 11.36, + "end": 11.38, + "confidence": 0.228 + }, + { + "text": "très", + "start": 11.38, + "end": 11.4, + "confidence": 0.255 + }, + { + "text": "très", + "start": 11.4, + "end": 11.42, + "confidence": 0.281 + }, + { + "text": "très", + "start": 11.42, + "end": 11.44, + "confidence": 0.322 + }, + { + "text": "très", + "start": 11.44, + "end": 11.46, + "confidence": 0.382 + }, + { + "text": "très", + "start": 11.46, + "end": 11.48, + "confidence": 0.457 + }, + { + "text": "très", + "start": 11.48, + "end": 11.5, + "confidence": 0.537 + }, + { + "text": "très", + "start": 11.5, + "end": 11.52, + "confidence": 0.592 + }, + { + "text": "très", + "start": 
11.52, + "end": 11.54, + "confidence": 0.634 + }, + { + "text": "très", + "start": 11.54, + "end": 11.56, + "confidence": 0.67 + }, + { + "text": "très", + "start": 11.56, + "end": 11.58, + "confidence": 0.69 + }, + { + "text": "très", + "start": 11.58, + "end": 11.6, + "confidence": 0.704 + }, + { + "text": "très", + "start": 11.6, + "end": 11.62, + "confidence": 0.719 + }, + { + "text": "très", + "start": 11.62, + "end": 11.64, + "confidence": 0.723 + }, + { + "text": "très", + "start": 11.64, + "end": 11.66, + "confidence": 0.735 + }, + { + "text": "très", + "start": 11.66, + "end": 11.68, + "confidence": 0.74 + }, + { + "text": "très", + "start": 11.68, + "end": 11.7, + "confidence": 0.75 + }, + { + "text": "très", + "start": 11.7, + "end": 11.72, + "confidence": 0.752 + }, + { + "text": "très", + "start": 11.72, + "end": 11.74, + "confidence": 0.751 + }, + { + "text": "très", + "start": 11.74, + "end": 11.76, + "confidence": 0.754 + }, + { + "text": "très", + "start": 11.76, + "end": 11.78, + "confidence": 0.755 + }, + { + "text": "très", + "start": 11.78, + "end": 11.8, + "confidence": 0.761 + }, + { + "text": "très", + "start": 11.8, + "end": 11.82, + "confidence": 0.76 + }, + { + "text": "très", + "start": 11.82, + "end": 11.84, + "confidence": 0.76 + }, + { + "text": "très", + "start": 11.84, + "end": 11.86, + "confidence": 0.766 + }, + { + "text": "très", + "start": 11.86, + "end": 11.88, + "confidence": 0.769 + }, + { + "text": "très", + "start": 11.88, + "end": 11.9, + "confidence": 0.769 + }, + { + "text": "très", + "start": 11.9, + "end": 11.92, + "confidence": 0.768 + }, + { + "text": "très", + "start": 11.92, + "end": 11.94, + "confidence": 0.77 + }, + { + "text": "très", + "start": 11.94, + "end": 11.96, + "confidence": 0.772 + }, + { + "text": "très", + "start": 11.96, + "end": 11.98, + "confidence": 0.775 + }, + { + "text": "très", + "start": 11.98, + "end": 12.0, + "confidence": 0.776 + }, + { + "text": "très", + "start": 12.0, + "end": 12.02, + 
"confidence": 0.776 + }, + { + "text": "très", + "start": 12.02, + "end": 12.8, + "confidence": 0.779 + }, + { + "text": "très", + "start": 12.8, + "end": 13.7, + "confidence": 0.782 + }, + { + "text": "très", + "start": 13.7, + "end": 13.72, + "confidence": 0.786 + }, + { + "text": "très", + "start": 13.72, + "end": 14.74, + "confidence": 0.781 + }, + { + "text": "très", + "start": 14.74, + "end": 14.76, + "confidence": 0.779 + }, + { + "text": "très", + "start": 14.76, + "end": 14.96, + "confidence": 0.784 + }, + { + "text": "très", + "start": 14.96, + "end": 14.98, + "confidence": 0.784 + }, + { + "text": "très", + "start": 14.98, + "end": 15.94, + "confidence": 0.785 + }, + { + "text": "très", + "start": 15.94, + "end": 15.96, + "confidence": 0.787 + }, + { + "text": "très", + "start": 15.96, + "end": 15.98, + "confidence": 0.787 + }, + { + "text": "très", + "start": 15.98, + "end": 16.0, + "confidence": 0.791 + }, + { + "text": "très", + "start": 16.0, + "end": 16.02, + "confidence": 0.79 + }, + { + "text": "très", + "start": 16.02, + "end": 16.04, + "confidence": 0.788 + }, + { + "text": "très", + "start": 16.04, + "end": 16.06, + "confidence": 0.788 + }, + { + "text": "très", + "start": 16.06, + "end": 16.08, + "confidence": 0.787 + }, + { + "text": "très", + "start": 16.08, + "end": 17.54, + "confidence": 0.793 + }, + { + "text": "très", + "start": 17.54, + "end": 17.56, + "confidence": 0.791 + }, + { + "text": "très", + "start": 17.56, + "end": 17.58, + "confidence": 0.793 + }, + { + "text": "très", + "start": 17.58, + "end": 17.6, + "confidence": 0.794 + }, + { + "text": "très", + "start": 17.6, + "end": 17.62, + "confidence": 0.798 + }, + { + "text": "très", + "start": 17.62, + "end": 17.64, + "confidence": 0.795 + }, + { + "text": "très", + "start": 17.64, + "end": 17.66, + "confidence": 0.796 + }, + { + "text": "très", + "start": 17.66, + "end": 17.68, + "confidence": 0.796 + }, + { + "text": "très", + "start": 17.68, + "end": 17.7, + "confidence": 
0.799 + }, + { + "text": "très", + "start": 17.7, + "end": 17.72, + "confidence": 0.801 + }, + { + "text": "très", + "start": 17.72, + "end": 17.74, + "confidence": 0.804 + }, + { + "text": "très", + "start": 17.74, + "end": 17.76, + "confidence": 0.803 + }, + { + "text": "très", + "start": 17.76, + "end": 17.78, + "confidence": 0.801 + }, + { + "text": "très", + "start": 17.78, + "end": 17.8, + "confidence": 0.805 + }, + { + "text": "très", + "start": 17.8, + "end": 17.82, + "confidence": 0.806 + }, + { + "text": "très", + "start": 17.82, + "end": 17.84, + "confidence": 0.808 + }, + { + "text": "très", + "start": 17.84, + "end": 17.86, + "confidence": 0.811 + }, + { + "text": "très", + "start": 17.86, + "end": 17.88, + "confidence": 0.814 + }, + { + "text": "très", + "start": 17.88, + "end": 17.9, + "confidence": 0.817 + }, + { + "text": "très", + "start": 17.9, + "end": 17.92, + "confidence": 0.819 + }, + { + "text": "très", + "start": 17.92, + "end": 17.94, + "confidence": 0.82 + }, + { + "text": "très", + "start": 17.94, + "end": 17.96, + "confidence": 0.823 + }, + { + "text": "très", + "start": 17.96, + "end": 17.98, + "confidence": 0.823 + }, + { + "text": "très", + "start": 17.98, + "end": 19.34, + "confidence": 0.827 + }, + { + "text": "très", + "start": 19.34, + "end": 19.36, + "confidence": 0.828 + }, + { + "text": "très", + "start": 19.36, + "end": 19.38, + "confidence": 0.835 + }, + { + "text": "très", + "start": 19.38, + "end": 19.4, + "confidence": 0.836 + }, + { + "text": "très", + "start": 19.4, + "end": 19.42, + "confidence": 0.839 + }, + { + "text": "très", + "start": 19.42, + "end": 19.44, + "confidence": 0.838 + }, + { + "text": "très", + "start": 19.44, + "end": 19.46, + "confidence": 0.841 + }, + { + "text": "très", + "start": 19.46, + "end": 19.48, + "confidence": 0.841 + }, + { + "text": "très", + "start": 19.48, + "end": 19.5, + "confidence": 0.843 + }, + { + "text": "très", + "start": 19.5, + "end": 19.52, + "confidence": 0.844 + }, + { + 
"text": "très", + "start": 19.52, + "end": 19.54, + "confidence": 0.848 + }, + { + "text": "très", + "start": 19.54, + "end": 19.56, + "confidence": 0.849 + }, + { + "text": "très", + "start": 19.56, + "end": 19.58, + "confidence": 0.848 + }, + { + "text": "très", + "start": 19.58, + "end": 19.6, + "confidence": 0.849 + }, + { + "text": "très", + "start": 19.6, + "end": 19.62, + "confidence": 0.852 + }, + { + "text": "très", + "start": 19.62, + "end": 19.64, + "confidence": 0.851 + }, + { + "text": "très", + "start": 19.64, + "end": 20.06, + "confidence": 0.852 + }, + { + "text": "très", + "start": 20.06, + "end": 20.14, + "confidence": 0.854 + }, + { + "text": "très", + "start": 20.14, + "end": 20.16, + "confidence": 0.854 + }, + { + "text": "très", + "start": 20.16, + "end": 20.18, + "confidence": 0.857 + }, + { + "text": "très", + "start": 20.18, + "end": 20.2, + "confidence": 0.857 + }, + { + "text": "très", + "start": 20.2, + "end": 20.22, + "confidence": 0.858 + }, + { + "text": "très", + "start": 20.22, + "end": 20.56, + "confidence": 0.859 + }, + { + "text": "très", + "start": 20.56, + "end": 20.58, + "confidence": 0.858 + }, + { + "text": "très", + "start": 20.58, + "end": 20.6, + "confidence": 0.86 + }, + { + "text": "très", + "start": 20.6, + "end": 20.62, + "confidence": 0.861 + }, + { + "text": "très", + "start": 20.62, + "end": 20.64, + "confidence": 0.864 + }, + { + "text": "très", + "start": 20.64, + "end": 20.66, + "confidence": 0.866 + }, + { + "text": "très", + "start": 20.66, + "end": 20.68, + "confidence": 0.866 + }, + { + "text": "très", + "start": 20.68, + "end": 20.7, + "confidence": 0.866 + }, + { + "text": "très", + "start": 20.7, + "end": 20.72, + "confidence": 0.862 + }, + { + "text": "très", + "start": 20.72, + "end": 20.74, + "confidence": 0.863 + }, + { + "text": "très", + "start": 20.74, + "end": 20.76, + "confidence": 0.864 + }, + { + "text": "très", + "start": 20.76, + "end": 20.78, + "confidence": 0.864 + }, + { + "text": "très", 
+ "start": 20.78, + "end": 20.8, + "confidence": 0.862 + }, + { + "text": "très", + "start": 20.8, + "end": 20.82, + "confidence": 0.861 + }, + { + "text": "très", + "start": 20.82, + "end": 20.84, + "confidence": 0.863 + }, + { + "text": "très", + "start": 20.84, + "end": 20.86, + "confidence": 0.862 + }, + { + "text": "très", + "start": 20.86, + "end": 20.88, + "confidence": 0.859 + }, + { + "text": "très", + "start": 20.88, + "end": 20.9, + "confidence": 0.855 + }, + { + "text": "très", + "start": 20.9, + "end": 20.92, + "confidence": 0.858 + }, + { + "text": "très", + "start": 20.92, + "end": 20.94, + "confidence": 0.856 + }, + { + "text": "très", + "start": 20.94, + "end": 20.96, + "confidence": 0.853 + }, + { + "text": "très", + "start": 20.96, + "end": 20.98, + "confidence": 0.849 + }, + { + "text": "très", + "start": 20.98, + "end": 21.0, + "confidence": 0.851 + }, + { + "text": "très", + "start": 21.0, + "end": 21.02, + "confidence": 0.853 + }, + { + "text": "très", + "start": 21.02, + "end": 21.04, + "confidence": 0.853 + }, + { + "text": "très", + "start": 21.04, + "end": 21.06, + "confidence": 0.848 + }, + { + "text": "très", + "start": 21.06, + "end": 21.08, + "confidence": 0.849 + }, + { + "text": "très", + "start": 21.08, + "end": 21.1, + "confidence": 0.851 + }, + { + "text": "très", + "start": 21.1, + "end": 21.12, + "confidence": 0.845 + }, + { + "text": "très", + "start": 21.12, + "end": 21.14, + "confidence": 0.849 + }, + { + "text": "très", + "start": 21.14, + "end": 21.16, + "confidence": 0.851 + }, + { + "text": "très", + "start": 21.16, + "end": 21.18, + "confidence": 0.851 + }, + { + "text": "très", + "start": 21.18, + "end": 21.2, + "confidence": 0.85 + }, + { + "text": "très", + "start": 21.2, + "end": 21.22, + "confidence": 0.847 + }, + { + "text": "très", + "start": 21.22, + "end": 21.24, + "confidence": 0.846 + }, + { + "text": "très", + "start": 21.24, + "end": 21.26, + "confidence": 0.843 + }, + { + "text": "très", + "start": 21.26, 
+ "end": 21.28, + "confidence": 0.844 + }, + { + "text": "très", + "start": 21.28, + "end": 21.3, + "confidence": 0.846 + }, + { + "text": "très", + "start": 21.3, + "end": 21.32, + "confidence": 0.838 + }, + { + "text": "très", + "start": 21.32, + "end": 21.34, + "confidence": 0.842 + }, + { + "text": "très", + "start": 21.34, + "end": 21.36, + "confidence": 0.841 + }, + { + "text": "très", + "start": 21.36, + "end": 21.38, + "confidence": 0.845 + }, + { + "text": "très", + "start": 21.38, + "end": 21.4, + "confidence": 0.839 + }, + { + "text": "très", + "start": 21.4, + "end": 21.42, + "confidence": 0.833 + }, + { + "text": "très", + "start": 21.42, + "end": 21.44, + "confidence": 0.826 + }, + { + "text": "très", + "start": 21.44, + "end": 21.46, + "confidence": 0.824 + }, + { + "text": "très", + "start": 21.46, + "end": 21.48, + "confidence": 0.824 + }, + { + "text": "très", + "start": 21.48, + "end": 21.5, + "confidence": 0.821 + }, + { + "text": "très", + "start": 21.5, + "end": 21.52, + "confidence": 0.823 + }, + { + "text": "très", + "start": 21.52, + "end": 21.54, + "confidence": 0.821 + }, + { + "text": "très", + "start": 21.54, + "end": 21.56, + "confidence": 0.827 + }, + { + "text": "très", + "start": 21.56, + "end": 21.58, + "confidence": 0.819 + }, + { + "text": "très", + "start": 21.58, + "end": 21.6, + "confidence": 0.816 + }, + { + "text": "très", + "start": 21.6, + "end": 21.62, + "confidence": 0.815 + }, + { + "text": "très", + "start": 21.62, + "end": 21.64, + "confidence": 0.815 + }, + { + "text": "très", + "start": 21.64, + "end": 21.66, + "confidence": 0.819 + }, + { + "text": "très", + "start": 21.66, + "end": 21.68, + "confidence": 0.811 + }, + { + "text": "très", + "start": 21.68, + "end": 21.7, + "confidence": 0.821 + }, + { + "text": "très", + "start": 21.7, + "end": 21.72, + "confidence": 0.811 + }, + { + "text": "très", + "start": 21.72, + "end": 21.74, + "confidence": 0.816 + }, + { + "text": "très", + "start": 21.74, + "end": 21.76, + 
"confidence": 0.819 + }, + { + "text": "très", + "start": 21.76, + "end": 21.78, + "confidence": 0.812 + }, + { + "text": "très", + "start": 21.78, + "end": 21.8, + "confidence": 0.815 + }, + { + "text": "très", + "start": 21.8, + "end": 21.82, + "confidence": 0.813 + }, + { + "text": "très", + "start": 21.82, + "end": 21.84, + "confidence": 0.811 + }, + { + "text": "très", + "start": 21.84, + "end": 21.86, + "confidence": 0.809 + }, + { + "text": "très", + "start": 21.86, + "end": 21.88, + "confidence": 0.802 + }, + { + "text": "très", + "start": 21.88, + "end": 21.9, + "confidence": 0.802 + }, + { + "text": "très", + "start": 21.9, + "end": 21.92, + "confidence": 0.798 + }, + { + "text": "très", + "start": 21.92, + "end": 21.94, + "confidence": 0.792 + }, + { + "text": "très", + "start": 21.94, + "end": 21.96, + "confidence": 0.802 + }, + { + "text": "très", + "start": 21.96, + "end": 21.98, + "confidence": 0.784 + }, + { + "text": "très", + "start": 21.98, + "end": 22.0, + "confidence": 0.78 + }, + { + "text": "très", + "start": 22.0, + "end": 22.02, + "confidence": 0.782 + }, + { + "text": "très", + "start": 22.02, + "end": 22.04, + "confidence": 0.783 + }, + { + "text": "très", + "start": 22.04, + "end": 22.06, + "confidence": 0.777 + }, + { + "text": "très", + "start": 22.06, + "end": 22.08, + "confidence": 0.778 + }, + { + "text": "très", + "start": 22.08, + "end": 22.1, + "confidence": 0.787 + }, + { + "text": "très", + "start": 22.1, + "end": 22.12, + "confidence": 0.789 + }, + { + "text": "très", + "start": 22.12, + "end": 22.14, + "confidence": 0.788 + }, + { + "text": "très", + "start": 22.14, + "end": 22.16, + "confidence": 0.788 + }, + { + "text": "très", + "start": 22.16, + "end": 22.18, + "confidence": 0.784 + }, + { + "text": "très", + "start": 22.18, + "end": 22.2, + "confidence": 0.777 + }, + { + "text": "très", + "start": 22.2, + "end": 22.22, + "confidence": 0.783 + }, + { + "text": "très", + "start": 22.22, + "end": 22.24, + "confidence": 
0.793 + }, + { + "text": "très", + "start": 22.24, + "end": 22.26, + "confidence": 0.794 + }, + { + "text": "très", + "start": 22.26, + "end": 22.28, + "confidence": 0.782 + }, + { + "text": "très", + "start": 22.28, + "end": 22.3, + "confidence": 0.788 + }, + { + "text": "très", + "start": 22.3, + "end": 22.32, + "confidence": 0.787 + }, + { + "text": "très", + "start": 22.32, + "end": 22.34, + "confidence": 0.782 + }, + { + "text": "très", + "start": 22.34, + "end": 22.36, + "confidence": 0.781 + }, + { + "text": "très", + "start": 22.36, + "end": 22.38, + "confidence": 0.788 + }, + { + "text": "très", + "start": 22.38, + "end": 22.4, + "confidence": 0.775 + }, + { + "text": "très", + "start": 22.4, + "end": 22.42, + "confidence": 0.777 + }, + { + "text": "très", + "start": 22.42, + "end": 22.44, + "confidence": 0.778 + }, + { + "text": "très", + "start": 22.44, + "end": 22.46, + "confidence": 0.77 + }, + { + "text": "très", + "start": 22.46, + "end": 22.48, + "confidence": 0.768 + }, + { + "text": "très", + "start": 22.48, + "end": 22.5, + "confidence": 0.768 + }, + { + "text": "très", + "start": 22.5, + "end": 22.52, + "confidence": 0.775 + }, + { + "text": "très", + "start": 22.52, + "end": 22.54, + "confidence": 0.763 + }, + { + "text": "très", + "start": 22.54, + "end": 22.56, + "confidence": 0.768 + }, + { + "text": "très", + "start": 22.56, + "end": 22.58, + "confidence": 0.759 + }, + { + "text": "très", + "start": 22.58, + "end": 22.6, + "confidence": 0.771 + }, + { + "text": "très", + "start": 22.6, + "end": 22.62, + "confidence": 0.764 + }, + { + "text": "très", + "start": 22.62, + "end": 22.64, + "confidence": 0.763 + }, + { + "text": "très", + "start": 22.64, + "end": 22.66, + "confidence": 0.772 + }, + { + "text": "très", + "start": 22.66, + "end": 22.68, + "confidence": 0.774 + }, + { + "text": "très", + "start": 22.68, + "end": 22.7, + "confidence": 0.764 + }, + { + "text": "très", + "start": 22.7, + "end": 22.72, + "confidence": 0.763 + }, + { + 
"text": "très", + "start": 22.72, + "end": 22.74, + "confidence": 0.755 + }, + { + "text": "très", + "start": 22.74, + "end": 22.76, + "confidence": 0.766 + }, + { + "text": "très", + "start": 22.76, + "end": 22.78, + "confidence": 0.766 + }, + { + "text": "très", + "start": 22.78, + "end": 22.8, + "confidence": 0.759 + }, + { + "text": "très", + "start": 22.8, + "end": 22.82, + "confidence": 0.768 + }, + { + "text": "très", + "start": 22.82, + "end": 23.04, + "confidence": 0.762 + }, + { + "text": "très", + "start": 23.04, + "end": 23.06, + "confidence": 0.764 + }, + { + "text": "très", + "start": 23.06, + "end": 23.08, + "confidence": 0.775 + }, + { + "text": "très", + "start": 23.08, + "end": 23.1, + "confidence": 0.785 + }, + { + "text": "très", + "start": 23.1, + "end": 23.5, + "confidence": 0.783 + }, + { + "text": "très", + "start": 23.5, + "end": 23.52, + "confidence": 0.792 + }, + { + "text": "très", + "start": 23.52, + "end": 23.54, + "confidence": 0.822 + }, + { + "text": "très", + "start": 23.54, + "end": 26.7, + "confidence": 0.791 + }, + { + "text": "très", + "start": 26.7, + "end": 29.98, + "confidence": 0.775 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/laugh1.mp3.words.json b/tests/expected/tiny_fr/laugh1.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..eb2fd3f9aad12383bae10efd67b83d1b964fe781 --- /dev/null +++ b/tests/expected/tiny_fr/laugh1.mp3.words.json @@ -0,0 +1,81 @@ +{ + "text": " Je vais vous donner un peu de temps.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.18, + "end": 1.72, + "text": " Je vais vous donner un peu de temps.", + "tokens": [ + 50364, + 2588, + 9369, + 2630, + 20882, + 517, + 5604, + 368, + 8827, + 13, + 50464 + ], + "temperature": 0.0, + "avg_logprob": -1.8613839149475098, + "compression_ratio": 0.8181818181818182, + "no_speech_prob": 0.4180056154727936, + "confidence": 0.103, + "words": [ + { + "text": "Je", + 
"start": 0.18, + "end": 0.82, + "confidence": 0.066 + }, + { + "text": "vais", + "start": 0.82, + "end": 1.04, + "confidence": 0.128 + }, + { + "text": "vous", + "start": 1.04, + "end": 1.06, + "confidence": 0.075 + }, + { + "text": "donner", + "start": 1.06, + "end": 1.26, + "confidence": 0.048 + }, + { + "text": "un", + "start": 1.26, + "end": 1.66, + "confidence": 0.144 + }, + { + "text": "peu", + "start": 1.66, + "end": 1.68, + "confidence": 0.091 + }, + { + "text": "de", + "start": 1.68, + "end": 1.7, + "confidence": 0.625 + }, + { + "text": "temps.", + "start": 1.7, + "end": 1.72, + "confidence": 0.053 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/laugh2.mp3.words.json b/tests/expected/tiny_fr/laugh2.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..f1d7d6f65ef571345c23b4098d89aad0a0ce1517 --- /dev/null +++ b/tests/expected/tiny_fr/laugh2.mp3.words.json @@ -0,0 +1,31 @@ +{ + "text": " ...", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.18, + "end": 0.66, + "text": " ...", + "tokens": [ + 50364, + 1097, + 50414 + ], + "temperature": 0.0, + "avg_logprob": -1.2521450519561768, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.5721203088760376, + "confidence": 0.088, + "words": [ + { + "text": "...", + "start": 0.18, + "end": 0.66, + "confidence": 0.088 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/punctuations.mp3.words.json b/tests/expected/tiny_fr/punctuations.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..1f16958b6309f821036a0f5a21562201b9249ac3 --- /dev/null +++ b/tests/expected/tiny_fr/punctuations.mp3.words.json @@ -0,0 +1,71 @@ +{ + "text": " Dima, est ce que l'on vole ?", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 2.58, + "text": " Dima, est ce que l'on vole ?", + "tokens": [ + 50364, + 413, + 4775, + 11, + 871, + 1769, 
+ 631, + 287, + 6, + 266, + 49877, + 2506, + 50494 + ], + "temperature": 0.0, + "avg_logprob": -0.8432660784040179, + "compression_ratio": 0.7777777777777778, + "no_speech_prob": 0.0010773586109280586, + "confidence": 0.456, + "words": [ + { + "text": "Dima,", + "start": 0.42, + "end": 0.84, + "confidence": 0.247 + }, + { + "text": "est", + "start": 1.2, + "end": 1.4, + "confidence": 0.93 + }, + { + "text": "ce", + "start": 1.4, + "end": 1.56, + "confidence": 0.587 + }, + { + "text": "que", + "start": 1.56, + "end": 1.68, + "confidence": 0.916 + }, + { + "text": "l'on", + "start": 1.68, + "end": 2.02, + "confidence": 0.481 + }, + { + "text": "vole ?", + "start": 2.02, + "end": 2.58, + "confidence": 0.249 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/radio_short.mp3.words.json b/tests/expected/tiny_fr/radio_short.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..89ebc4084194b018f68524608248adb9cce76c01 --- /dev/null +++ b/tests/expected/tiny_fr/radio_short.mp3.words.json @@ -0,0 +1,106 @@ +{ + "text": " ... ... ... 
...", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.44, + "end": 1.46, + "text": " ...", + "tokens": [ + 50364, + 1097, + 50614 + ], + "temperature": 0.0, + "avg_logprob": -1.4211220741271973, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.5096546411514282, + "confidence": 0.224, + "words": [ + { + "text": "...", + "start": 0.44, + "end": 1.46, + "confidence": 0.224 + } + ] + }, + { + "id": 1, + "seek": 6000, + "start": 60.0, + "end": 69.42, + "text": " ...", + "tokens": [ + 50364, + 1097, + 51714 + ], + "temperature": 0.0, + "avg_logprob": -0.965636134147644, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.8783581256866455, + "confidence": 0.464, + "words": [ + { + "text": "...", + "start": 60.0, + "end": 69.42, + "confidence": 0.464 + } + ] + }, + { + "id": 2, + "seek": 9000, + "start": 105.48, + "end": 105.5, + "text": " ...", + "tokens": [ + 50364, + 1097, + 51114 + ], + "temperature": 0.0, + "avg_logprob": -0.8222528457641601, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.640861988067627, + "confidence": 0.842, + "words": [ + { + "text": "...", + "start": 105.48, + "end": 105.5, + "confidence": 0.842 + } + ] + }, + { + "id": 3, + "seek": 10500, + "start": 106.84, + "end": 108.62, + "text": " ...", + "tokens": [ + 50414, + 1097, + 50864 + ], + "temperature": 0.0, + "avg_logprob": -0.923416793346405, + "compression_ratio": 0.2727272727272727, + "no_speech_prob": 0.8327455520629883, + "confidence": 0.47, + "words": [ + { + "text": "...", + "start": 106.84, + "end": 108.62, + "confidence": 0.47 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/tiny_fr/smartphone.mp3.words.json b/tests/expected/tiny_fr/smartphone.mp3.words.json new file mode 100644 index 0000000000000000000000000000000000000000..2cc965cbb861935e22aec7bb1065ee2edbc145c8 --- /dev/null +++ b/tests/expected/tiny_fr/smartphone.mp3.words.json @@ -0,0 +1,5091 @@ +{ + "text": " C'est évidence que 
dit Nicolas, mais je me l'étais jamais formulé comme ça. Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière dans quelques interagues entraîne. Et il est d'ailleurs, c'est la photo c'est hyper convaincant. Alors évidemment, il faudrait ajouter les interfaces les grand-attachilles à été beaucoup très souvent mentionnées. Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs nous ont appris à piquer sur des icônes, sauf que, alors le smartphone ajoute le toucher, qui rend le contact plus direct, plus sensible. Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté tout flu de la navigation web pour aller directement en but. Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas, dit qu'il est très symbolablement inédit dans l'histoire de l'humanité. Mais ça s'assoulait d'une autre interrogation. Est-ce que le fait que cette objet soit inédit un d'huits que notre rapport a lui est aussi un rapport inédit ? Est-ce que le rapport qu'on a au sein de foi n'est comparable à celui qu'on entretenait à d'autres objectes techniques comme la voiture ou le téléphone ? Il n'y a pas d'équivalent. On s'est espèrent de nous voter dans la relation à l'objet. C'est facilement éterricion. Parce que la passion de l'utilisateur et ses affices a dépendance, cette objet d'un lieu en fait, une espèce de relation de médiation avec le monde qui rendent encore avec la maille de celles formes de rogeur. Donc, à objets inédits, rapport inédits. Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépendance et de rogeur. Bon, en vrai, il faudrait remonter très, très filmant tout l'histoire des objectes techniques et de leur infertion dans nos vieux pour déterminer si ce rapport est totalement inédit. Mais j'ai l'impression comme ça que Nicolas se trompe pas vraiment. Pour autant, je sache. 
Il y a eu plein de discussions autour de la voiture ou même du téléphone. Mais, la dépense n'était pas du même mort, donc le rejet n'en plus n'était pas du même mort. On peut adorer sa bagnure. On a par besoin pour plein de choses. Et là, le soir, quand on va se coucher, on la laisse. On la pade en la main quand on est colis, qu'on n'a même pas au chiot. On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une heure chaque soir pour discuter avec un copain. Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui. Continuellement avec son smartphone dans la main, comme c'était une sorte de estimateur extère de tomber de lâcher à l'éantrénée, ça m'a eu immédiate. Bon, je dis ça pour le mome, mais évidemment, va là, bon aussi. Donc, rapport immédiate d'accord. Mais pourquoi, à ton impression qu'on en sortira, j'amé? Et puis, il faut en remettre la faute sur les gens qui ont créé cette critique merveilleux et diabolique et diabolique par que merveilleux. Les économistes parlent de dépendance du santé. 
Ces vidéos, en fait, on est un santé qui a été étabis, un soit mon termine, en marchand dessus, soit des finissants débordes, des finissants, une signalétique.", + "segments": [ + { + "id": 0, + "seek": 0, + "start": 0.42, + "end": 3.66, + "text": " C'est évidence que dit Nicolas, mais je me l'étais jamais formulé comme ça.", + "tokens": [ + 50364, + 383, + 6, + 377, + 20090, + 2778, + 631, + 6176, + 38268, + 11, + 2420, + 1506, + 385, + 287, + 6, + 22824, + 14540, + 49990, + 526, + 5173, + 2788, + 13, + 50545 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.709, + "words": [ + { + "text": "C'est", + "start": 0.42, + "end": 0.68, + "confidence": 0.849 + }, + { + "text": "évidence", + "start": 0.68, + "end": 0.94, + "confidence": 0.368 + }, + { + "text": "que", + "start": 0.94, + "end": 1.08, + "confidence": 0.883 + }, + { + "text": "dit", + "start": 1.08, + "end": 1.2, + "confidence": 0.343 + }, + { + "text": "Nicolas,", + "start": 1.2, + "end": 1.44, + "confidence": 0.921 + }, + { + "text": "mais", + "start": 1.88, + "end": 2.14, + "confidence": 0.914 + }, + { + "text": "je", + "start": 2.14, + "end": 2.26, + "confidence": 0.778 + }, + { + "text": "me", + "start": 2.26, + "end": 2.34, + "confidence": 0.954 + }, + { + "text": "l'étais", + "start": 2.34, + "end": 2.58, + "confidence": 0.72 + }, + { + "text": "jamais", + "start": 2.58, + "end": 2.86, + "confidence": 0.946 + }, + { + "text": "formulé", + "start": 2.86, + "end": 3.26, + "confidence": 0.53 + }, + { + "text": "comme", + "start": 3.26, + "end": 3.46, + "confidence": 0.968 + }, + { + "text": "ça.", + "start": 3.46, + "end": 3.66, + "confidence": 0.96 + } + ] + }, + { + "id": 1, + "seek": 0, + "start": 4.14, + "end": 8.9, + "text": " Ce qui fait la force du smartphone, c'est pas seulement la cumulation des fonctions, mais la manière", + "tokens": [ + 50545, + 8257, + 1956, + 3887, + 635, + 
3464, + 1581, + 13307, + 11, + 269, + 6, + 377, + 1736, + 27772, + 635, + 12713, + 2776, + 730, + 17290, + 3916, + 11, + 2420, + 635, + 22267, + 50806 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.789, + "words": [ + { + "text": "Ce", + "start": 4.14, + "end": 4.26, + "confidence": 0.392 + }, + { + "text": "qui", + "start": 4.26, + "end": 4.38, + "confidence": 0.94 + }, + { + "text": "fait", + "start": 4.38, + "end": 4.56, + "confidence": 0.732 + }, + { + "text": "la", + "start": 4.56, + "end": 4.72, + "confidence": 0.988 + }, + { + "text": "force", + "start": 4.72, + "end": 5.02, + "confidence": 0.93 + }, + { + "text": "du", + "start": 5.02, + "end": 5.2, + "confidence": 0.938 + }, + { + "text": "smartphone,", + "start": 5.2, + "end": 5.58, + "confidence": 0.909 + }, + { + "text": "c'est", + "start": 5.9, + "end": 6.2, + "confidence": 0.947 + }, + { + "text": "pas", + "start": 6.2, + "end": 6.26, + "confidence": 0.983 + }, + { + "text": "seulement", + "start": 6.26, + "end": 6.6, + "confidence": 0.993 + }, + { + "text": "la", + "start": 6.6, + "end": 6.8, + "confidence": 0.633 + }, + { + "text": "cumulation", + "start": 6.8, + "end": 7.34, + "confidence": 0.689 + }, + { + "text": "des", + "start": 7.34, + "end": 7.56, + "confidence": 0.792 + }, + { + "text": "fonctions,", + "start": 7.56, + "end": 8.14, + "confidence": 0.834 + }, + { + "text": "mais", + "start": 8.38, + "end": 8.5, + "confidence": 0.668 + }, + { + "text": "la", + "start": 8.5, + "end": 8.62, + "confidence": 0.719 + }, + { + "text": "manière", + "start": 8.62, + "end": 8.9, + "confidence": 0.498 + } + ] + }, + { + "id": 2, + "seek": 0, + "start": 8.9, + "end": 10.98, + "text": " dans quelques interagues entraîne.", + "tokens": [ + 50806, + 2680, + 16597, + 728, + 559, + 1247, + 22284, + 24741, + 13, + 50906 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + 
"compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.303, + "words": [ + { + "text": "dans", + "start": 8.9, + "end": 9.06, + "confidence": 0.284 + }, + { + "text": "quelques", + "start": 9.06, + "end": 9.28, + "confidence": 0.281 + }, + { + "text": "interagues", + "start": 9.28, + "end": 10.38, + "confidence": 0.246 + }, + { + "text": "entraîne.", + "start": 10.38, + "end": 10.98, + "confidence": 0.446 + } + ] + }, + { + "id": 3, + "seek": 0, + "start": 11.0, + "end": 12.96, + "text": " Et il est d'ailleurs, c'est la photo c'est hyper convaincant.", + "tokens": [ + 50906, + 3790, + 1930, + 871, + 274, + 6, + 19400, + 11, + 269, + 6, + 377, + 635, + 5052, + 269, + 6, + 377, + 9848, + 3754, + 491, + 66, + 394, + 13, + 51006 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.63, + "words": [ + { + "text": "Et", + "start": 11.0, + "end": 11.12, + "confidence": 0.36 + }, + { + "text": "il", + "start": 11.12, + "end": 11.28, + "confidence": 0.144 + }, + { + "text": "est", + "start": 11.28, + "end": 11.38, + "confidence": 0.241 + }, + { + "text": "d'ailleurs,", + "start": 11.38, + "end": 11.6, + "confidence": 0.904 + }, + { + "text": "c'est", + "start": 11.7, + "end": 11.78, + "confidence": 0.886 + }, + { + "text": "la", + "start": 11.78, + "end": 11.8, + "confidence": 0.969 + }, + { + "text": "photo", + "start": 11.8, + "end": 12.02, + "confidence": 0.809 + }, + { + "text": "c'est", + "start": 12.02, + "end": 12.26, + "confidence": 0.785 + }, + { + "text": "hyper", + "start": 12.26, + "end": 12.46, + "confidence": 0.938 + }, + { + "text": "convaincant.", + "start": 12.46, + "end": 12.96, + "confidence": 0.51 + } + ] + }, + { + "id": 4, + "seek": 0, + "start": 13.3, + "end": 18.8, + "text": " Alors évidemment, il faudrait ajouter les interfaces les grand-attachilles à été beaucoup très souvent", + "tokens": [ + 
51006, + 9946, + 24724, + 11, + 1930, + 38694, + 8645, + 17680, + 23985, + 1512, + 28416, + 1512, + 2697, + 12, + 1591, + 608, + 14835, + 1531, + 8862, + 8796, + 5732, + 20847, + 51306 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.532, + "words": [ + { + "text": "Alors", + "start": 13.3, + "end": 13.56, + "confidence": 0.894 + }, + { + "text": "évidemment,", + "start": 13.56, + "end": 13.82, + "confidence": 0.778 + }, + { + "text": "il", + "start": 14.38, + "end": 14.4, + "confidence": 0.964 + }, + { + "text": "faudrait", + "start": 14.4, + "end": 14.76, + "confidence": 0.856 + }, + { + "text": "ajouter", + "start": 14.76, + "end": 15.38, + "confidence": 0.883 + }, + { + "text": "les", + "start": 15.38, + "end": 15.6, + "confidence": 0.934 + }, + { + "text": "interfaces", + "start": 15.6, + "end": 16.0, + "confidence": 0.38 + }, + { + "text": "les", + "start": 16.0, + "end": 16.5, + "confidence": 0.463 + }, + { + "text": "grand-attachilles", + "start": 16.5, + "end": 17.16, + "confidence": 0.213 + }, + { + "text": "à", + "start": 17.16, + "end": 17.32, + "confidence": 0.406 + }, + { + "text": "été", + "start": 17.32, + "end": 17.72, + "confidence": 0.894 + }, + { + "text": "beaucoup", + "start": 17.72, + "end": 18.28, + "confidence": 0.797 + }, + { + "text": "très", + "start": 18.28, + "end": 18.64, + "confidence": 0.493 + }, + { + "text": "souvent", + "start": 18.64, + "end": 18.8, + "confidence": 0.822 + } + ] + }, + { + "id": 5, + "seek": 0, + "start": 18.8, + "end": 19.84, + "text": " mentionnées.", + "tokens": [ + 51306, + 2152, + 77, + 6836, + 13, + 51356 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.626, + "words": [ + { + "text": "mentionnées.", + "start": 18.8, + "end": 19.84, + "confidence": 0.626 + } + ] + }, + { + 
"id": 6, + "seek": 0, + "start": 20.02, + "end": 23.58, + "text": " Mais bon, il faudrait que les profites aussi de 20 ans pendant l'été, les ordinateurs", + "tokens": [ + 51356, + 6313, + 4428, + 11, + 1930, + 38694, + 8645, + 631, + 1512, + 1740, + 3324, + 6212, + 368, + 945, + 1567, + 17338, + 287, + 6, + 21210, + 11, + 1512, + 4792, + 13923, + 2156, + 51543 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.658, + "words": [ + { + "text": "Mais", + "start": 20.02, + "end": 20.26, + "confidence": 0.98 + }, + { + "text": "bon,", + "start": 20.26, + "end": 20.46, + "confidence": 0.568 + }, + { + "text": "il", + "start": 20.6, + "end": 20.68, + "confidence": 0.975 + }, + { + "text": "faudrait", + "start": 20.68, + "end": 20.78, + "confidence": 0.771 + }, + { + "text": "que", + "start": 20.78, + "end": 20.92, + "confidence": 0.388 + }, + { + "text": "les", + "start": 20.92, + "end": 20.96, + "confidence": 0.22 + }, + { + "text": "profites", + "start": 20.96, + "end": 21.36, + "confidence": 0.57 + }, + { + "text": "aussi", + "start": 21.36, + "end": 21.72, + "confidence": 0.52 + }, + { + "text": "de", + "start": 21.72, + "end": 21.92, + "confidence": 0.492 + }, + { + "text": "20", + "start": 21.92, + "end": 22.14, + "confidence": 0.915 + }, + { + "text": "ans", + "start": 22.14, + "end": 22.32, + "confidence": 0.942 + }, + { + "text": "pendant", + "start": 22.32, + "end": 22.52, + "confidence": 0.916 + }, + { + "text": "l'été,", + "start": 22.52, + "end": 22.86, + "confidence": 0.48 + }, + { + "text": "les", + "start": 22.98, + "end": 23.1, + "confidence": 0.903 + }, + { + "text": "ordinateurs", + "start": 23.1, + "end": 23.58, + "confidence": 0.946 + } + ] + }, + { + "id": 7, + "seek": 0, + "start": 23.58, + "end": 28.07, + "text": " nous ont appris à piquer sur des icônes, sauf que, alors le smartphone ajoute le toucher,", + "tokens": [ + 51543, + 
4666, + 6592, + 724, + 5714, + 1531, + 280, + 23909, + 1022, + 730, + 4376, + 2851, + 4081, + 11, + 601, + 2947, + 631, + 11, + 11246, + 476, + 13307, + 17680, + 14040, + 476, + 2557, + 260, + 11, + 51766 + ], + "temperature": 0.0, + "avg_logprob": -0.5389881480823864, + "compression_ratio": 1.6505681818181819, + "no_speech_prob": 0.14073368906974792, + "confidence": 0.656, + "words": [ + { + "text": "nous", + "start": 23.58, + "end": 23.78, + "confidence": 0.767 + }, + { + "text": "ont", + "start": 23.78, + "end": 23.9, + "confidence": 0.98 + }, + { + "text": "appris", + "start": 23.9, + "end": 24.12, + "confidence": 0.952 + }, + { + "text": "à", + "start": 24.12, + "end": 24.26, + "confidence": 0.34 + }, + { + "text": "piquer", + "start": 24.26, + "end": 24.54, + "confidence": 0.449 + }, + { + "text": "sur", + "start": 24.54, + "end": 24.72, + "confidence": 0.816 + }, + { + "text": "des", + "start": 24.72, + "end": 24.9, + "confidence": 0.96 + }, + { + "text": "icônes,", + "start": 24.9, + "end": 25.56, + "confidence": 0.599 + }, + { + "text": "sauf", + "start": 25.64, + "end": 25.8, + "confidence": 0.522 + }, + { + "text": "que,", + "start": 25.8, + "end": 26.36, + "confidence": 0.915 + }, + { + "text": "alors", + "start": 26.36, + "end": 26.58, + "confidence": 0.396 + }, + { + "text": "le", + "start": 26.58, + "end": 26.72, + "confidence": 0.824 + }, + { + "text": "smartphone", + "start": 26.72, + "end": 27.0, + "confidence": 0.977 + }, + { + "text": "ajoute", + "start": 27.0, + "end": 27.5, + "confidence": 0.674 + }, + { + "text": "le", + "start": 27.5, + "end": 27.62, + "confidence": 0.552 + }, + { + "text": "toucher,", + "start": 27.62, + "end": 28.07, + "confidence": 0.631 + } + ] + }, + { + "id": 8, + "seek": 2804, + "start": 28.07, + "end": 30.6, + "text": " qui rend le contact plus direct, plus sensible.", + "tokens": [ + 50364, + 1956, + 6125, + 476, + 3385, + 1804, + 2047, + 11, + 1804, + 25380, + 13, + 50496 + ], + "temperature": 0.0, + "avg_logprob": 
-0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.742, + "words": [ + { + "text": "qui", + "start": 28.07, + "end": 28.26, + "confidence": 0.305 + }, + { + "text": "rend", + "start": 28.26, + "end": 28.5, + "confidence": 0.763 + }, + { + "text": "le", + "start": 28.5, + "end": 28.72, + "confidence": 0.988 + }, + { + "text": "contact", + "start": 28.72, + "end": 29.06, + "confidence": 0.817 + }, + { + "text": "plus", + "start": 29.06, + "end": 29.48, + "confidence": 0.84 + }, + { + "text": "direct,", + "start": 29.48, + "end": 30.02, + "confidence": 0.944 + }, + { + "text": "plus", + "start": 30.18, + "end": 30.24, + "confidence": 0.992 + }, + { + "text": "sensible.", + "start": 30.24, + "end": 30.6, + "confidence": 0.618 + } + ] + }, + { + "id": 9, + "seek": 2804, + "start": 31.1, + "end": 34.76, + "text": " Et puis, évidemment, il faudrait parler aussi des applications qui permettent de contourner le côté", + "tokens": [ + 50496, + 3790, + 9093, + 11, + 24724, + 11, + 1930, + 38694, + 8645, + 16421, + 6212, + 730, + 5821, + 1956, + 21540, + 317, + 368, + 21234, + 1193, + 476, + 18437, + 50698 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.777, + "words": [ + { + "text": "Et", + "start": 31.1, + "end": 31.24, + "confidence": 0.949 + }, + { + "text": "puis,", + "start": 31.24, + "end": 31.36, + "confidence": 0.721 + }, + { + "text": "évidemment,", + "start": 31.42, + "end": 31.62, + "confidence": 0.213 + }, + { + "text": "il", + "start": 31.7, + "end": 31.76, + "confidence": 0.959 + }, + { + "text": "faudrait", + "start": 31.76, + "end": 31.94, + "confidence": 0.994 + }, + { + "text": "parler", + "start": 31.94, + "end": 32.14, + "confidence": 0.847 + }, + { + "text": "aussi", + "start": 32.14, + "end": 32.36, + "confidence": 0.925 + }, + { + "text": "des", + "start": 32.36, + 
"end": 32.46, + "confidence": 0.921 + }, + { + "text": "applications", + "start": 32.46, + "end": 32.88, + "confidence": 0.857 + }, + { + "text": "qui", + "start": 32.88, + "end": 33.2, + "confidence": 0.663 + }, + { + "text": "permettent", + "start": 33.2, + "end": 33.8, + "confidence": 0.952 + }, + { + "text": "de", + "start": 33.8, + "end": 33.96, + "confidence": 0.951 + }, + { + "text": "contourner", + "start": 33.96, + "end": 34.4, + "confidence": 0.721 + }, + { + "text": "le", + "start": 34.4, + "end": 34.52, + "confidence": 0.654 + }, + { + "text": "côté", + "start": 34.52, + "end": 34.76, + "confidence": 0.641 + } + ] + }, + { + "id": 10, + "seek": 2804, + "start": 34.8, + "end": 37.86, + "text": " tout flu de la navigation web pour aller directement en but.", + "tokens": [ + 50698, + 3486, + 5029, + 368, + 635, + 17346, + 3670, + 2016, + 8722, + 37297, + 465, + 457, + 13, + 50860 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.735, + "words": [ + { + "text": "tout", + "start": 34.8, + "end": 35.04, + "confidence": 0.945 + }, + { + "text": "flu", + "start": 35.04, + "end": 35.32, + "confidence": 0.484 + }, + { + "text": "de", + "start": 35.32, + "end": 35.64, + "confidence": 0.35 + }, + { + "text": "la", + "start": 35.64, + "end": 35.78, + "confidence": 0.921 + }, + { + "text": "navigation", + "start": 35.78, + "end": 36.24, + "confidence": 0.903 + }, + { + "text": "web", + "start": 36.24, + "end": 36.64, + "confidence": 0.913 + }, + { + "text": "pour", + "start": 36.64, + "end": 36.84, + "confidence": 0.57 + }, + { + "text": "aller", + "start": 36.84, + "end": 37.06, + "confidence": 0.991 + }, + { + "text": "directement", + "start": 37.06, + "end": 37.48, + "confidence": 0.981 + }, + { + "text": "en", + "start": 37.48, + "end": 37.7, + "confidence": 0.654 + }, + { + "text": "but.", + "start": 37.7, + "end": 37.86, + "confidence": 0.768 + } 
+ ] + }, + { + "id": 11, + "seek": 2804, + "start": 38.78, + "end": 43.12, + "text": " Bref, tout ça, ce sont les conditions qui permettent de créer cette objet, en Nicolas,", + "tokens": [ + 50860, + 49957, + 11, + 3486, + 2788, + 11, + 1769, + 4900, + 1512, + 4487, + 1956, + 21540, + 317, + 368, + 32062, + 5550, + 14964, + 11, + 465, + 38268, + 11, + 51121 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.737, + "words": [ + { + "text": "Bref,", + "start": 38.78, + "end": 38.8, + "confidence": 0.972 + }, + { + "text": "tout", + "start": 38.84, + "end": 39.04, + "confidence": 0.817 + }, + { + "text": "ça,", + "start": 39.04, + "end": 39.46, + "confidence": 0.984 + }, + { + "text": "ce", + "start": 39.54, + "end": 39.76, + "confidence": 0.905 + }, + { + "text": "sont", + "start": 39.76, + "end": 39.96, + "confidence": 0.98 + }, + { + "text": "les", + "start": 39.96, + "end": 40.1, + "confidence": 0.982 + }, + { + "text": "conditions", + "start": 40.1, + "end": 40.64, + "confidence": 0.956 + }, + { + "text": "qui", + "start": 40.64, + "end": 40.96, + "confidence": 0.995 + }, + { + "text": "permettent", + "start": 40.96, + "end": 41.58, + "confidence": 0.994 + }, + { + "text": "de", + "start": 41.58, + "end": 41.64, + "confidence": 0.993 + }, + { + "text": "créer", + "start": 41.64, + "end": 42.08, + "confidence": 0.91 + }, + { + "text": "cette", + "start": 42.08, + "end": 42.34, + "confidence": 0.473 + }, + { + "text": "objet,", + "start": 42.34, + "end": 42.64, + "confidence": 0.235 + }, + { + "text": "en", + "start": 42.7, + "end": 42.84, + "confidence": 0.221 + }, + { + "text": "Nicolas,", + "start": 42.84, + "end": 43.12, + "confidence": 0.537 + } + ] + }, + { + "id": 12, + "seek": 2804, + "start": 43.12, + "end": 46.58, + "text": " dit qu'il est très symbolablement inédit dans l'histoire de l'humanité.", + "tokens": [ + 51121, + 6176, + 421, + 6, 
+ 388, + 871, + 5732, + 5986, + 712, + 518, + 294, + 7811, + 270, + 2680, + 287, + 6, + 29093, + 368, + 287, + 6, + 18796, + 5066, + 13, + 51290 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.717, + "words": [ + { + "text": "dit", + "start": 43.12, + "end": 43.56, + "confidence": 0.696 + }, + { + "text": "qu'il", + "start": 43.56, + "end": 43.76, + "confidence": 0.958 + }, + { + "text": "est", + "start": 43.76, + "end": 43.9, + "confidence": 0.849 + }, + { + "text": "très", + "start": 43.9, + "end": 44.08, + "confidence": 0.443 + }, + { + "text": "symbolablement", + "start": 44.08, + "end": 44.86, + "confidence": 0.321 + }, + { + "text": "inédit", + "start": 44.86, + "end": 45.54, + "confidence": 0.655 + }, + { + "text": "dans", + "start": 45.54, + "end": 45.74, + "confidence": 0.817 + }, + { + "text": "l'histoire", + "start": 45.74, + "end": 46.02, + "confidence": 0.824 + }, + { + "text": "de", + "start": 46.02, + "end": 46.14, + "confidence": 0.983 + }, + { + "text": "l'humanité.", + "start": 46.14, + "end": 46.58, + "confidence": 0.99 + } + ] + }, + { + "id": 13, + "seek": 2804, + "start": 47.06, + "end": 48.76, + "text": " Mais ça s'assoulait d'une autre interrogation.", + "tokens": [ + 51290, + 6313, + 2788, + 262, + 6, + 640, + 263, + 35235, + 274, + 6, + 2613, + 15081, + 24871, + 399, + 13, + 51402 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.717, + "words": [ + { + "text": "Mais", + "start": 47.06, + "end": 47.24, + "confidence": 0.928 + }, + { + "text": "ça", + "start": 47.24, + "end": 47.48, + "confidence": 0.75 + }, + { + "text": "s'assoulait", + "start": 47.48, + "end": 47.84, + "confidence": 0.616 + }, + { + "text": "d'une", + "start": 47.84, + "end": 48.08, + "confidence": 0.674 + }, + { + "text": "autre", + 
"start": 48.08, + "end": 48.18, + "confidence": 0.964 + }, + { + "text": "interrogation.", + "start": 48.18, + "end": 48.76, + "confidence": 0.855 + } + ] + }, + { + "id": 14, + "seek": 2804, + "start": 49.42, + "end": 54.93, + "text": " Est-ce que le fait que cette objet soit inédit un d'huits que notre rapport a lui est aussi un rapport", + "tokens": [ + 51402, + 4410, + 12, + 384, + 631, + 476, + 3887, + 631, + 5550, + 14964, + 12703, + 294, + 7811, + 270, + 517, + 274, + 6, + 12086, + 1208, + 631, + 10349, + 18018, + 257, + 8783, + 871, + 6212, + 517, + 18018, + 51710 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.704, + "words": [ + { + "text": "Est-ce", + "start": 49.42, + "end": 49.7, + "confidence": 0.919 + }, + { + "text": "que", + "start": 49.7, + "end": 49.74, + "confidence": 0.99 + }, + { + "text": "le", + "start": 49.74, + "end": 49.82, + "confidence": 0.871 + }, + { + "text": "fait", + "start": 49.82, + "end": 50.02, + "confidence": 0.945 + }, + { + "text": "que", + "start": 50.02, + "end": 50.16, + "confidence": 0.923 + }, + { + "text": "cette", + "start": 50.16, + "end": 50.3, + "confidence": 0.943 + }, + { + "text": "objet", + "start": 50.3, + "end": 50.64, + "confidence": 0.963 + }, + { + "text": "soit", + "start": 50.64, + "end": 51.1, + "confidence": 0.99 + }, + { + "text": "inédit", + "start": 51.1, + "end": 51.82, + "confidence": 0.928 + }, + { + "text": "un", + "start": 51.82, + "end": 52.08, + "confidence": 0.511 + }, + { + "text": "d'huits", + "start": 52.08, + "end": 52.34, + "confidence": 0.246 + }, + { + "text": "que", + "start": 52.34, + "end": 52.44, + "confidence": 0.974 + }, + { + "text": "notre", + "start": 52.44, + "end": 52.66, + "confidence": 0.992 + }, + { + "text": "rapport", + "start": 52.66, + "end": 53.24, + "confidence": 0.779 + }, + { + "text": "a", + "start": 53.24, + "end": 53.5, + "confidence": 0.57 + 
}, + { + "text": "lui", + "start": 53.5, + "end": 53.7, + "confidence": 0.701 + }, + { + "text": "est", + "start": 53.7, + "end": 54.04, + "confidence": 0.879 + }, + { + "text": "aussi", + "start": 54.04, + "end": 54.52, + "confidence": 0.815 + }, + { + "text": "un", + "start": 54.52, + "end": 54.7, + "confidence": 0.48 + }, + { + "text": "rapport", + "start": 54.7, + "end": 54.93, + "confidence": 0.952 + } + ] + }, + { + "id": 15, + "seek": 2804, + "start": 54.93, + "end": 55.88, + "text": " inédit ?", + "tokens": [ + 51710, + 294, + 7811, + 270, + 2506, + 51760 + ], + "temperature": 0.0, + "avg_logprob": -0.4256427271836469, + "compression_ratio": 1.7156549520766773, + "no_speech_prob": 0.12921307981014252, + "confidence": 0.86, + "words": [ + { + "text": "inédit ?", + "start": 54.93, + "end": 55.88, + "confidence": 0.86 + } + ] + }, + { + "id": 16, + "seek": 5596, + "start": 55.96, + "end": 59.36, + "text": " Est-ce que le rapport qu'on a au sein de foi n'est comparable à celui qu'on entretenait", + "tokens": [ + 50364, + 4410, + 12, + 384, + 631, + 476, + 18018, + 421, + 6, + 266, + 257, + 1609, + 6195, + 368, + 6901, + 297, + 6, + 377, + 25323, + 1531, + 22829, + 421, + 6, + 266, + 3962, + 1147, + 1001, + 50530 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.62, + "words": [ + { + "text": "Est-ce", + "start": 55.96, + "end": 56.38, + "confidence": 0.553 + }, + { + "text": "que", + "start": 56.38, + "end": 56.44, + "confidence": 0.892 + }, + { + "text": "le", + "start": 56.44, + "end": 56.58, + "confidence": 0.982 + }, + { + "text": "rapport", + "start": 56.58, + "end": 56.9, + "confidence": 0.999 + }, + { + "text": "qu'on", + "start": 56.9, + "end": 57.14, + "confidence": 0.902 + }, + { + "text": "a", + "start": 57.14, + "end": 57.2, + "confidence": 0.959 + }, + { + "text": "au", + "start": 57.2, + "end": 57.28, + "confidence": 0.273 + }, + { 
+ "text": "sein", + "start": 57.28, + "end": 57.42, + "confidence": 0.17 + }, + { + "text": "de", + "start": 57.42, + "end": 57.56, + "confidence": 0.229 + }, + { + "text": "foi", + "start": 57.56, + "end": 57.58, + "confidence": 0.121 + }, + { + "text": "n'est", + "start": 57.58, + "end": 57.78, + "confidence": 0.79 + }, + { + "text": "comparable", + "start": 57.78, + "end": 58.28, + "confidence": 0.547 + }, + { + "text": "à", + "start": 58.28, + "end": 58.48, + "confidence": 0.934 + }, + { + "text": "celui", + "start": 58.48, + "end": 58.7, + "confidence": 0.851 + }, + { + "text": "qu'on", + "start": 58.7, + "end": 58.94, + "confidence": 0.926 + }, + { + "text": "entretenait", + "start": 58.94, + "end": 59.36, + "confidence": 0.56 + } + ] + }, + { + "id": 17, + "seek": 5596, + "start": 59.36, + "end": 63.14, + "text": " à d'autres objectes techniques comme la voiture ou le téléphone ?", + "tokens": [ + 50530, + 1531, + 274, + 6, + 16752, + 2657, + 279, + 7512, + 5173, + 635, + 38859, + 2820, + 476, + 47159, + 2506, + 50714 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.756, + "words": [ + { + "text": "à", + "start": 59.36, + "end": 59.44, + "confidence": 0.951 + }, + { + "text": "d'autres", + "start": 59.44, + "end": 59.68, + "confidence": 0.857 + }, + { + "text": "objectes", + "start": 59.68, + "end": 60.02, + "confidence": 0.507 + }, + { + "text": "techniques", + "start": 60.02, + "end": 60.44, + "confidence": 0.462 + }, + { + "text": "comme", + "start": 60.44, + "end": 61.04, + "confidence": 0.639 + }, + { + "text": "la", + "start": 61.04, + "end": 61.52, + "confidence": 0.905 + }, + { + "text": "voiture", + "start": 61.52, + "end": 61.86, + "confidence": 0.946 + }, + { + "text": "ou", + "start": 61.86, + "end": 62.46, + "confidence": 0.755 + }, + { + "text": "le", + "start": 62.46, + "end": 62.68, + "confidence": 0.913 + }, + { + "text": 
"téléphone ?", + "start": 62.68, + "end": 63.14, + "confidence": 0.983 + } + ] + }, + { + "id": 18, + "seek": 5596, + "start": 65.4, + "end": 66.16, + "text": " Il n'y a pas d'équivalent.", + "tokens": [ + 50714, + 4416, + 297, + 6, + 88, + 257, + 1736, + 274, + 6, + 20183, + 3576, + 317, + 13, + 50872 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.881, + "words": [ + { + "text": "Il", + "start": 65.4, + "end": 65.5, + "confidence": 0.901 + }, + { + "text": "n'y", + "start": 65.5, + "end": 65.54, + "confidence": 0.86 + }, + { + "text": "a", + "start": 65.54, + "end": 65.56, + "confidence": 0.962 + }, + { + "text": "pas", + "start": 65.56, + "end": 65.68, + "confidence": 0.998 + }, + { + "text": "d'équivalent.", + "start": 65.68, + "end": 66.16, + "confidence": 0.852 + } + ] + }, + { + "id": 19, + "seek": 5596, + "start": 66.16, + "end": 69.92, + "text": " On s'est espèrent de nous voter dans la relation à l'objet.", + "tokens": [ + 50872, + 1282, + 262, + 6, + 377, + 7089, + 1462, + 1753, + 368, + 4666, + 21722, + 2680, + 635, + 9721, + 1531, + 287, + 6, + 996, + 7108, + 13, + 51058 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.501, + "words": [ + { + "text": "On", + "start": 66.16, + "end": 67.08, + "confidence": 0.302 + }, + { + "text": "s'est", + "start": 67.08, + "end": 67.3, + "confidence": 0.563 + }, + { + "text": "espèrent", + "start": 67.3, + "end": 67.62, + "confidence": 0.134 + }, + { + "text": "de", + "start": 67.62, + "end": 67.66, + "confidence": 0.99 + }, + { + "text": "nous", + "start": 67.66, + "end": 67.84, + "confidence": 0.763 + }, + { + "text": "voter", + "start": 67.84, + "end": 68.36, + "confidence": 0.181 + }, + { + "text": "dans", + "start": 68.36, + "end": 68.86, + "confidence": 0.82 + }, + { + "text": 
"la", + "start": 68.86, + "end": 68.96, + "confidence": 0.617 + }, + { + "text": "relation", + "start": 68.96, + "end": 69.24, + "confidence": 0.949 + }, + { + "text": "à", + "start": 69.24, + "end": 69.42, + "confidence": 0.75 + }, + { + "text": "l'objet.", + "start": 69.42, + "end": 69.92, + "confidence": 0.887 + } + ] + }, + { + "id": 20, + "seek": 5596, + "start": 70.2, + "end": 71.22, + "text": " C'est facilement éterricion.", + "tokens": [ + 51058, + 383, + 6, + 377, + 23670, + 518, + 1136, + 391, + 1341, + 313, + 13, + 51122 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.441, + "words": [ + { + "text": "C'est", + "start": 70.2, + "end": 70.34, + "confidence": 0.895 + }, + { + "text": "facilement", + "start": 70.34, + "end": 70.7, + "confidence": 0.562 + }, + { + "text": "éterricion.", + "start": 70.7, + "end": 71.22, + "confidence": 0.23 + } + ] + }, + { + "id": 21, + "seek": 5596, + "start": 71.64, + "end": 76.97, + "text": " Parce que la passion de l'utilisateur et ses affices a dépendance, cette objet d'un lieu", + "tokens": [ + 51122, + 20429, + 631, + 635, + 5418, + 368, + 287, + 6, + 20835, + 271, + 15540, + 1030, + 5385, + 2096, + 1473, + 257, + 45768, + 719, + 11, + 5550, + 14964, + 274, + 6, + 409, + 26036, + 51416 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.457, + "words": [ + { + "text": "Parce", + "start": 71.64, + "end": 71.94, + "confidence": 0.679 + }, + { + "text": "que", + "start": 71.94, + "end": 72.32, + "confidence": 0.566 + }, + { + "text": "la", + "start": 72.32, + "end": 72.56, + "confidence": 0.336 + }, + { + "text": "passion", + "start": 72.56, + "end": 72.9, + "confidence": 0.267 + }, + { + "text": "de", + "start": 72.9, + "end": 73.24, + "confidence": 0.365 + }, + { + "text": "l'utilisateur", 
+ "start": 73.24, + "end": 74.82, + "confidence": 0.499 + }, + { + "text": "et", + "start": 74.82, + "end": 74.92, + "confidence": 0.45 + }, + { + "text": "ses", + "start": 74.92, + "end": 75.04, + "confidence": 0.095 + }, + { + "text": "affices", + "start": 75.04, + "end": 75.24, + "confidence": 0.303 + }, + { + "text": "a", + "start": 75.24, + "end": 75.38, + "confidence": 0.59 + }, + { + "text": "dépendance,", + "start": 75.38, + "end": 76.06, + "confidence": 0.559 + }, + { + "text": "cette", + "start": 76.32, + "end": 76.34, + "confidence": 0.401 + }, + { + "text": "objet", + "start": 76.34, + "end": 76.54, + "confidence": 0.924 + }, + { + "text": "d'un", + "start": 76.54, + "end": 76.92, + "confidence": 0.783 + }, + { + "text": "lieu", + "start": 76.92, + "end": 76.97, + "confidence": 0.307 + } + ] + }, + { + "id": 22, + "seek": 5596, + "start": 76.97, + "end": 82.15, + "text": " en fait, une espèce de relation de médiation avec le monde qui rendent encore avec", + "tokens": [ + 51416, + 465, + 3887, + 11, + 2251, + 7089, + 30236, + 368, + 9721, + 368, + 42436, + 399, + 4163, + 476, + 10431, + 1956, + 6125, + 317, + 10122, + 4163, + 51671 + ], + "temperature": 0.0, + "avg_logprob": -0.6293370928083147, + "compression_ratio": 1.5749128919860627, + "no_speech_prob": 0.21948836743831635, + "confidence": 0.746, + "words": [ + { + "text": "en", + "start": 76.97, + "end": 77.2, + "confidence": 0.767 + }, + { + "text": "fait,", + "start": 77.2, + "end": 77.32, + "confidence": 0.944 + }, + { + "text": "une", + "start": 77.46, + "end": 77.48, + "confidence": 0.696 + }, + { + "text": "espèce", + "start": 77.48, + "end": 77.9, + "confidence": 0.97 + }, + { + "text": "de", + "start": 77.9, + "end": 78.08, + "confidence": 0.994 + }, + { + "text": "relation", + "start": 78.08, + "end": 78.5, + "confidence": 0.826 + }, + { + "text": "de", + "start": 78.5, + "end": 78.94, + "confidence": 0.72 + }, + { + "text": "médiation", + "start": 78.94, + "end": 79.5, + "confidence": 
0.881 + }, + { + "text": "avec", + "start": 79.5, + "end": 79.74, + "confidence": 0.968 + }, + { + "text": "le", + "start": 79.74, + "end": 79.94, + "confidence": 0.986 + }, + { + "text": "monde", + "start": 79.94, + "end": 80.44, + "confidence": 0.906 + }, + { + "text": "qui", + "start": 80.44, + "end": 81.14, + "confidence": 0.825 + }, + { + "text": "rendent", + "start": 81.14, + "end": 81.8, + "confidence": 0.584 + }, + { + "text": "encore", + "start": 81.8, + "end": 81.98, + "confidence": 0.198 + }, + { + "text": "avec", + "start": 81.98, + "end": 82.15, + "confidence": 0.486 + } + ] + }, + { + "id": 23, + "seek": 8210, + "start": 82.15, + "end": 83.44, + "text": " la maille de celles formes de rogeur.", + "tokens": [ + 50364, + 635, + 463, + 3409, + 368, + 2815, + 279, + 1254, + 279, + 368, + 744, + 432, + 374, + 13, + 50440 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.465, + "words": [ + { + "text": "la", + "start": 82.15, + "end": 82.22, + "confidence": 0.648 + }, + { + "text": "maille", + "start": 82.22, + "end": 82.4, + "confidence": 0.136 + }, + { + "text": "de", + "start": 82.4, + "end": 82.48, + "confidence": 0.585 + }, + { + "text": "celles", + "start": 82.48, + "end": 82.74, + "confidence": 0.561 + }, + { + "text": "formes", + "start": 82.74, + "end": 82.96, + "confidence": 0.78 + }, + { + "text": "de", + "start": 82.96, + "end": 83.0, + "confidence": 0.936 + }, + { + "text": "rogeur.", + "start": 83.0, + "end": 83.44, + "confidence": 0.433 + } + ] + }, + { + "id": 24, + "seek": 8210, + "start": 83.98, + "end": 87.86, + "text": " Donc, à objets inédits, rapport inédits.", + "tokens": [ + 50440, + 7477, + 11, + 1531, + 1111, + 25349, + 294, + 7811, + 1208, + 11, + 18018, + 294, + 7811, + 1208, + 13, + 50640 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + 
"no_speech_prob": 0.2066797912120819, + "confidence": 0.745, + "words": [ + { + "text": "Donc,", + "start": 83.98, + "end": 84.46, + "confidence": 0.833 + }, + { + "text": "à", + "start": 84.56, + "end": 84.96, + "confidence": 0.696 + }, + { + "text": "objets", + "start": 84.96, + "end": 85.44, + "confidence": 0.526 + }, + { + "text": "inédits,", + "start": 85.44, + "end": 86.24, + "confidence": 0.701 + }, + { + "text": "rapport", + "start": 86.32, + "end": 86.92, + "confidence": 0.944 + }, + { + "text": "inédits.", + "start": 86.92, + "end": 87.86, + "confidence": 0.908 + } + ] + }, + { + "id": 25, + "seek": 8210, + "start": 88.1, + "end": 94.2, + "text": " Et, ce rapport, si j'en prends Nicolas, frère caractérisée par un mélange de dépendance", + "tokens": [ + 50640, + 3790, + 11, + 1769, + 18018, + 11, + 1511, + 361, + 6, + 268, + 46750, + 38268, + 11, + 431, + 4212, + 1032, + 578, + 4198, + 50027, + 971, + 517, + 41953, + 933, + 368, + 45768, + 719, + 50972 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.669, + "words": [ + { + "text": "Et,", + "start": 88.1, + "end": 88.3, + "confidence": 0.865 + }, + { + "text": "ce", + "start": 88.58, + "end": 88.84, + "confidence": 0.277 + }, + { + "text": "rapport,", + "start": 88.84, + "end": 89.28, + "confidence": 0.998 + }, + { + "text": "si", + "start": 89.38, + "end": 89.56, + "confidence": 0.933 + }, + { + "text": "j'en", + "start": 89.56, + "end": 89.74, + "confidence": 0.78 + }, + { + "text": "prends", + "start": 89.74, + "end": 89.92, + "confidence": 0.307 + }, + { + "text": "Nicolas,", + "start": 89.92, + "end": 90.22, + "confidence": 0.65 + }, + { + "text": "frère", + "start": 90.78, + "end": 91.1, + "confidence": 0.431 + }, + { + "text": "caractérisée", + "start": 91.1, + "end": 91.8, + "confidence": 0.595 + }, + { + "text": "par", + "start": 91.8, + "end": 92.14, + "confidence": 0.907 + }, + { 
+ "text": "un", + "start": 92.14, + "end": 92.34, + "confidence": 0.989 + }, + { + "text": "mélange", + "start": 92.34, + "end": 92.98, + "confidence": 0.92 + }, + { + "text": "de", + "start": 92.98, + "end": 93.24, + "confidence": 0.842 + }, + { + "text": "dépendance", + "start": 93.24, + "end": 94.2, + "confidence": 0.675 + } + ] + }, + { + "id": 26, + "seek": 8210, + "start": 94.36, + "end": 95.08, + "text": " et de rogeur.", + "tokens": [ + 50972, + 1030, + 368, + 744, + 432, + 374, + 13, + 51022 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.851, + "words": [ + { + "text": "et", + "start": 94.36, + "end": 94.52, + "confidence": 0.97 + }, + { + "text": "de", + "start": 94.52, + "end": 94.64, + "confidence": 0.996 + }, + { + "text": "rogeur.", + "start": 94.64, + "end": 95.08, + "confidence": 0.773 + } + ] + }, + { + "id": 27, + "seek": 8210, + "start": 96.3, + "end": 100.48, + "text": " Bon, en vrai, il faudrait remonter très, très filmant tout l'histoire des objectes", + "tokens": [ + 51022, + 7368, + 11, + 465, + 17815, + 11, + 1930, + 38694, + 8645, + 890, + 41806, + 5732, + 11, + 5732, + 2007, + 394, + 3486, + 287, + 6, + 29093, + 730, + 2657, + 279, + 51286 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.752, + "words": [ + { + "text": "Bon,", + "start": 96.3, + "end": 96.32, + "confidence": 0.6 + }, + { + "text": "en", + "start": 96.36, + "end": 96.58, + "confidence": 0.918 + }, + { + "text": "vrai,", + "start": 96.58, + "end": 96.92, + "confidence": 0.992 + }, + { + "text": "il", + "start": 97.14, + "end": 97.18, + "confidence": 0.987 + }, + { + "text": "faudrait", + "start": 97.18, + "end": 97.56, + "confidence": 0.933 + }, + { + "text": "remonter", + "start": 97.56, + "end": 98.08, + "confidence": 0.61 + }, + { + 
"text": "très,", + "start": 98.08, + "end": 98.56, + "confidence": 0.975 + }, + { + "text": "très", + "start": 98.56, + "end": 98.86, + "confidence": 0.986 + }, + { + "text": "filmant", + "start": 98.86, + "end": 99.42, + "confidence": 0.409 + }, + { + "text": "tout", + "start": 99.42, + "end": 99.68, + "confidence": 0.348 + }, + { + "text": "l'histoire", + "start": 99.68, + "end": 100.08, + "confidence": 0.876 + }, + { + "text": "des", + "start": 100.08, + "end": 100.22, + "confidence": 0.957 + }, + { + "text": "objectes", + "start": 100.22, + "end": 100.48, + "confidence": 0.842 + } + ] + }, + { + "id": 28, + "seek": 8210, + "start": 100.48, + "end": 105.24, + "text": " techniques et de leur infertion dans nos vieux pour déterminer si ce rapport est totalement", + "tokens": [ + 51286, + 7512, + 1030, + 368, + 9580, + 1536, + 911, + 313, + 2680, + 3269, + 4941, + 2449, + 2016, + 2795, + 29725, + 260, + 1511, + 1769, + 18018, + 871, + 45203, + 51530 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.614, + "words": [ + { + "text": "techniques", + "start": 100.48, + "end": 101.0, + "confidence": 0.952 + }, + { + "text": "et", + "start": 101.0, + "end": 101.58, + "confidence": 0.943 + }, + { + "text": "de", + "start": 101.58, + "end": 101.72, + "confidence": 0.975 + }, + { + "text": "leur", + "start": 101.72, + "end": 101.8, + "confidence": 0.803 + }, + { + "text": "infertion", + "start": 101.8, + "end": 102.34, + "confidence": 0.382 + }, + { + "text": "dans", + "start": 102.34, + "end": 102.5, + "confidence": 0.297 + }, + { + "text": "nos", + "start": 102.5, + "end": 102.68, + "confidence": 0.419 + }, + { + "text": "vieux", + "start": 102.68, + "end": 103.08, + "confidence": 0.386 + }, + { + "text": "pour", + "start": 103.08, + "end": 103.1, + "confidence": 0.281 + }, + { + "text": "déterminer", + "start": 103.1, + "end": 103.64, + "confidence": 0.976 
+ }, + { + "text": "si", + "start": 103.64, + "end": 103.8, + "confidence": 0.367 + }, + { + "text": "ce", + "start": 103.8, + "end": 103.92, + "confidence": 0.983 + }, + { + "text": "rapport", + "start": 103.92, + "end": 104.22, + "confidence": 0.998 + }, + { + "text": "est", + "start": 104.22, + "end": 104.88, + "confidence": 0.942 + }, + { + "text": "totalement", + "start": 104.88, + "end": 105.24, + "confidence": 0.907 + } + ] + }, + { + "id": 29, + "seek": 8210, + "start": 105.24, + "end": 106.1, + "text": " inédit.", + "tokens": [ + 51530, + 294, + 7811, + 270, + 13, + 51580 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.939, + "words": [ + { + "text": "inédit.", + "start": 105.24, + "end": 106.1, + "confidence": 0.939 + } + ] + }, + { + "id": 30, + "seek": 8210, + "start": 106.16, + "end": 109.44, + "text": " Mais j'ai l'impression comme ça que Nicolas se trompe pas vraiment.", + "tokens": [ + 51580, + 6313, + 361, + 6, + 1301, + 287, + 6, + 36107, + 5173, + 2788, + 631, + 38268, + 369, + 504, + 298, + 494, + 1736, + 8322, + 13, + 51738 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.811, + "words": [ + { + "text": "Mais", + "start": 106.16, + "end": 106.5, + "confidence": 0.721 + }, + { + "text": "j'ai", + "start": 106.5, + "end": 106.92, + "confidence": 0.91 + }, + { + "text": "l'impression", + "start": 106.92, + "end": 107.34, + "confidence": 0.956 + }, + { + "text": "comme", + "start": 107.34, + "end": 107.58, + "confidence": 0.7 + }, + { + "text": "ça", + "start": 107.58, + "end": 107.74, + "confidence": 0.953 + }, + { + "text": "que", + "start": 107.74, + "end": 108.06, + "confidence": 0.941 + }, + { + "text": "Nicolas", + "start": 108.06, + "end": 108.46, + "confidence": 0.994 + }, + { + "text": "se", + "start": 
108.46, + "end": 108.68, + "confidence": 0.716 + }, + { + "text": "trompe", + "start": 108.68, + "end": 109.02, + "confidence": 0.54 + }, + { + "text": "pas", + "start": 109.02, + "end": 109.16, + "confidence": 0.886 + }, + { + "text": "vraiment.", + "start": 109.16, + "end": 109.44, + "confidence": 0.963 + } + ] + }, + { + "id": 31, + "seek": 8210, + "start": 109.92, + "end": 110.86, + "text": " Pour autant, je sache.", + "tokens": [ + 51738, + 8732, + 34081, + 11, + 1506, + 262, + 6000, + 13, + 51808 + ], + "temperature": 0.0, + "avg_logprob": -0.45904387403654573, + "compression_ratio": 1.6159169550173011, + "no_speech_prob": 0.2066797912120819, + "confidence": 0.6, + "words": [ + { + "text": "Pour", + "start": 109.92, + "end": 110.1, + "confidence": 0.49 + }, + { + "text": "autant,", + "start": 110.1, + "end": 110.28, + "confidence": 0.75 + }, + { + "text": "je", + "start": 110.42, + "end": 110.48, + "confidence": 0.931 + }, + { + "text": "sache.", + "start": 110.48, + "end": 110.86, + "confidence": 0.477 + } + ] + }, + { + "id": 32, + "seek": 11098, + "start": 111.04, + "end": 115.0, + "text": " Il y a eu plein de discussions autour de la voiture ou même du téléphone.", + "tokens": [ + 50364, + 4416, + 288, + 257, + 2228, + 21088, + 368, + 11088, + 30249, + 368, + 635, + 38859, + 2820, + 5698, + 1581, + 47159, + 13, + 50568 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.821, + "words": [ + { + "text": "Il", + "start": 111.04, + "end": 111.2, + "confidence": 0.905 + }, + { + "text": "y", + "start": 111.2, + "end": 111.3, + "confidence": 0.934 + }, + { + "text": "a", + "start": 111.3, + "end": 111.56, + "confidence": 0.893 + }, + { + "text": "eu", + "start": 111.56, + "end": 111.6, + "confidence": 0.839 + }, + { + "text": "plein", + "start": 111.6, + "end": 111.88, + "confidence": 0.776 + }, + { + "text": "de", + "start": 111.88, + "end": 
112.12, + "confidence": 0.944 + }, + { + "text": "discussions", + "start": 112.12, + "end": 112.6, + "confidence": 0.681 + }, + { + "text": "autour", + "start": 112.6, + "end": 113.04, + "confidence": 0.978 + }, + { + "text": "de", + "start": 113.04, + "end": 113.48, + "confidence": 0.975 + }, + { + "text": "la", + "start": 113.48, + "end": 113.56, + "confidence": 0.966 + }, + { + "text": "voiture", + "start": 113.56, + "end": 113.88, + "confidence": 0.983 + }, + { + "text": "ou", + "start": 113.88, + "end": 114.14, + "confidence": 0.66 + }, + { + "text": "même", + "start": 114.14, + "end": 114.34, + "confidence": 0.99 + }, + { + "text": "du", + "start": 114.34, + "end": 114.64, + "confidence": 0.283 + }, + { + "text": "téléphone.", + "start": 114.64, + "end": 115.0, + "confidence": 0.986 + } + ] + }, + { + "id": 33, + "seek": 11098, + "start": 115.52, + "end": 119.51, + "text": " Mais, la dépense n'était pas du même mort, donc le rejet n'en plus n'était pas du même", + "tokens": [ + 50568, + 6313, + 11, + 635, + 27998, + 1288, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 6599, + 11, + 5926, + 476, + 319, + 7108, + 297, + 6, + 268, + 1804, + 297, + 6, + 9743, + 1736, + 1581, + 5698, + 50790 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.701, + "words": [ + { + "text": "Mais,", + "start": 115.52, + "end": 115.82, + "confidence": 0.983 + }, + { + "text": "la", + "start": 115.9, + "end": 116.0, + "confidence": 0.961 + }, + { + "text": "dépense", + "start": 116.0, + "end": 116.42, + "confidence": 0.616 + }, + { + "text": "n'était", + "start": 116.42, + "end": 116.82, + "confidence": 0.955 + }, + { + "text": "pas", + "start": 116.82, + "end": 117.04, + "confidence": 0.994 + }, + { + "text": "du", + "start": 117.04, + "end": 117.2, + "confidence": 0.958 + }, + { + "text": "même", + "start": 117.2, + "end": 117.38, + "confidence": 0.929 + }, + { + 
"text": "mort,", + "start": 117.38, + "end": 117.58, + "confidence": 0.686 + }, + { + "text": "donc", + "start": 117.7, + "end": 118.02, + "confidence": 0.932 + }, + { + "text": "le", + "start": 118.02, + "end": 118.34, + "confidence": 0.95 + }, + { + "text": "rejet", + "start": 118.34, + "end": 118.64, + "confidence": 0.57 + }, + { + "text": "n'en", + "start": 118.64, + "end": 118.82, + "confidence": 0.429 + }, + { + "text": "plus", + "start": 118.82, + "end": 118.96, + "confidence": 0.055 + }, + { + "text": "n'était", + "start": 118.96, + "end": 119.16, + "confidence": 0.973 + }, + { + "text": "pas", + "start": 119.16, + "end": 119.32, + "confidence": 0.993 + }, + { + "text": "du", + "start": 119.32, + "end": 119.42, + "confidence": 0.823 + }, + { + "text": "même", + "start": 119.42, + "end": 119.51, + "confidence": 0.79 + } + ] + }, + { + "id": 34, + "seek": 11098, + "start": 119.51, + "end": 119.72, + "text": " mort.", + "tokens": [ + 50790, + 6599, + 13, + 50840 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.639, + "words": [ + { + "text": "mort.", + "start": 119.51, + "end": 119.72, + "confidence": 0.639 + } + ] + }, + { + "id": 35, + "seek": 11098, + "start": 120.04, + "end": 121.24, + "text": " On peut adorer sa bagnure.", + "tokens": [ + 50840, + 1282, + 5977, + 614, + 17618, + 601, + 3411, + 77, + 540, + 13, + 50890 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.615, + "words": [ + { + "text": "On", + "start": 120.04, + "end": 120.22, + "confidence": 0.981 + }, + { + "text": "peut", + "start": 120.22, + "end": 120.36, + "confidence": 0.988 + }, + { + "text": "adorer", + "start": 120.36, + "end": 120.7, + "confidence": 0.859 + }, + { + "text": "sa", + "start": 120.7, + "end": 120.88, + "confidence": 0.918 + }, + { + 
"text": "bagnure.", + "start": 120.88, + "end": 121.24, + "confidence": 0.314 + } + ] + }, + { + "id": 36, + "seek": 11098, + "start": 121.38, + "end": 123.06, + "text": " On a par besoin pour plein de choses.", + "tokens": [ + 50890, + 1282, + 257, + 971, + 19207, + 2016, + 21088, + 368, + 14488, + 13, + 50972 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.722, + "words": [ + { + "text": "On", + "start": 121.38, + "end": 121.56, + "confidence": 0.897 + }, + { + "text": "a", + "start": 121.56, + "end": 121.64, + "confidence": 0.656 + }, + { + "text": "par", + "start": 121.64, + "end": 121.8, + "confidence": 0.161 + }, + { + "text": "besoin", + "start": 121.8, + "end": 122.12, + "confidence": 0.947 + }, + { + "text": "pour", + "start": 122.12, + "end": 122.5, + "confidence": 0.976 + }, + { + "text": "plein", + "start": 122.5, + "end": 122.72, + "confidence": 0.857 + }, + { + "text": "de", + "start": 122.72, + "end": 122.8, + "confidence": 0.993 + }, + { + "text": "choses.", + "start": 122.8, + "end": 123.06, + "confidence": 0.989 + } + ] + }, + { + "id": 37, + "seek": 11098, + "start": 123.36, + "end": 126.46, + "text": " Et là, le soir, quand on va se coucher, on la laisse.", + "tokens": [ + 50972, + 3790, + 3684, + 11, + 476, + 27105, + 11, + 6932, + 322, + 2773, + 369, + 1384, + 6759, + 11, + 322, + 635, + 30969, + 13, + 51142 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.835, + "words": [ + { + "text": "Et", + "start": 123.36, + "end": 123.5, + "confidence": 0.606 + }, + { + "text": "là,", + "start": 123.5, + "end": 123.76, + "confidence": 0.498 + }, + { + "text": "le", + "start": 123.82, + "end": 124.06, + "confidence": 0.986 + }, + { + "text": "soir,", + "start": 124.06, + "end": 124.42, + "confidence": 0.971 + }, + { + 
"text": "quand", + "start": 124.84, + "end": 124.96, + "confidence": 0.787 + }, + { + "text": "on", + "start": 124.96, + "end": 125.06, + "confidence": 0.988 + }, + { + "text": "va", + "start": 125.06, + "end": 125.18, + "confidence": 0.966 + }, + { + "text": "se", + "start": 125.18, + "end": 125.26, + "confidence": 0.869 + }, + { + "text": "coucher,", + "start": 125.26, + "end": 125.6, + "confidence": 0.804 + }, + { + "text": "on", + "start": 125.82, + "end": 126.06, + "confidence": 0.98 + }, + { + "text": "la", + "start": 126.06, + "end": 126.2, + "confidence": 0.811 + }, + { + "text": "laisse.", + "start": 126.2, + "end": 126.46, + "confidence": 0.985 + } + ] + }, + { + "id": 38, + "seek": 11098, + "start": 127.06, + "end": 130.1, + "text": " On la pade en la main quand on est colis, qu'on n'a même pas au chiot.", + "tokens": [ + 51142, + 1282, + 635, + 280, + 762, + 465, + 635, + 2135, + 6932, + 322, + 871, + 1173, + 271, + 11, + 421, + 6, + 266, + 297, + 6, + 64, + 5698, + 1736, + 1609, + 417, + 6471, + 13, + 51334 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.542, + "words": [ + { + "text": "On", + "start": 127.06, + "end": 127.32, + "confidence": 0.605 + }, + { + "text": "la", + "start": 127.32, + "end": 127.5, + "confidence": 0.35 + }, + { + "text": "pade", + "start": 127.5, + "end": 127.72, + "confidence": 0.18 + }, + { + "text": "en", + "start": 127.72, + "end": 127.88, + "confidence": 0.775 + }, + { + "text": "la", + "start": 127.88, + "end": 128.04, + "confidence": 0.795 + }, + { + "text": "main", + "start": 128.04, + "end": 128.3, + "confidence": 0.971 + }, + { + "text": "quand", + "start": 128.3, + "end": 128.46, + "confidence": 0.483 + }, + { + "text": "on", + "start": 128.46, + "end": 128.62, + "confidence": 0.994 + }, + { + "text": "est", + "start": 128.62, + "end": 128.74, + "confidence": 0.714 + }, + { + "text": "colis,", + 
"start": 128.74, + "end": 129.12, + "confidence": 0.501 + }, + { + "text": "qu'on", + "start": 129.22, + "end": 129.32, + "confidence": 0.777 + }, + { + "text": "n'a", + "start": 129.32, + "end": 129.42, + "confidence": 0.439 + }, + { + "text": "même", + "start": 129.42, + "end": 129.56, + "confidence": 0.324 + }, + { + "text": "pas", + "start": 129.56, + "end": 129.74, + "confidence": 1.0 + }, + { + "text": "au", + "start": 129.74, + "end": 129.88, + "confidence": 0.64 + }, + { + "text": "chiot.", + "start": 129.88, + "end": 130.1, + "confidence": 0.514 + } + ] + }, + { + "id": 39, + "seek": 11098, + "start": 130.94, + "end": 135.32, + "text": " On pouvait être émervé par son mome qui occupeait la ligne de téléphone pendant une heure", + "tokens": [ + 51334, + 1282, + 45913, + 7418, + 1136, + 936, + 15797, + 971, + 1872, + 275, + 423, + 1956, + 2678, + 84, + 494, + 1001, + 635, + 34207, + 368, + 47159, + 17338, + 2251, + 30027, + 51574 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.656, + "words": [ + { + "text": "On", + "start": 130.94, + "end": 131.04, + "confidence": 0.99 + }, + { + "text": "pouvait", + "start": 131.04, + "end": 131.28, + "confidence": 0.588 + }, + { + "text": "être", + "start": 131.28, + "end": 131.6, + "confidence": 0.446 + }, + { + "text": "émervé", + "start": 131.6, + "end": 132.24, + "confidence": 0.725 + }, + { + "text": "par", + "start": 132.24, + "end": 132.5, + "confidence": 0.848 + }, + { + "text": "son", + "start": 132.5, + "end": 132.7, + "confidence": 0.445 + }, + { + "text": "mome", + "start": 132.7, + "end": 133.08, + "confidence": 0.255 + }, + { + "text": "qui", + "start": 133.08, + "end": 133.3, + "confidence": 0.911 + }, + { + "text": "occupeait", + "start": 133.3, + "end": 133.74, + "confidence": 0.642 + }, + { + "text": "la", + "start": 133.74, + "end": 133.86, + "confidence": 0.808 + }, + { + "text": 
"ligne", + "start": 133.86, + "end": 134.02, + "confidence": 0.975 + }, + { + "text": "de", + "start": 134.02, + "end": 134.24, + "confidence": 0.928 + }, + { + "text": "téléphone", + "start": 134.24, + "end": 134.56, + "confidence": 0.978 + }, + { + "text": "pendant", + "start": 134.56, + "end": 134.92, + "confidence": 0.901 + }, + { + "text": "une", + "start": 134.92, + "end": 135.18, + "confidence": 0.811 + }, + { + "text": "heure", + "start": 135.18, + "end": 135.32, + "confidence": 0.477 + } + ] + }, + { + "id": 40, + "seek": 11098, + "start": 135.32, + "end": 137.04, + "text": " chaque soir pour discuter avec un copain.", + "tokens": [ + 51574, + 18920, + 27105, + 2016, + 2983, + 20314, + 4163, + 517, + 2971, + 491, + 13, + 51664 + ], + "temperature": 0.0, + "avg_logprob": -0.44320285092493533, + "compression_ratio": 1.7050847457627119, + "no_speech_prob": 0.15390530228614807, + "confidence": 0.955, + "words": [ + { + "text": "chaque", + "start": 135.32, + "end": 135.6, + "confidence": 0.99 + }, + { + "text": "soir", + "start": 135.6, + "end": 135.8, + "confidence": 0.997 + }, + { + "text": "pour", + "start": 135.8, + "end": 136.0, + "confidence": 0.981 + }, + { + "text": "discuter", + "start": 136.0, + "end": 136.34, + "confidence": 0.882 + }, + { + "text": "avec", + "start": 136.34, + "end": 136.5, + "confidence": 0.993 + }, + { + "text": "un", + "start": 136.5, + "end": 136.62, + "confidence": 0.967 + }, + { + "text": "copain.", + "start": 136.62, + "end": 137.04, + "confidence": 0.953 + } + ] + }, + { + "id": 41, + "seek": 13698, + "start": 137.32, + "end": 141.84, + "text": " Mais ça ne ressemble pas à ce qu'on peut ressentir à voir même mome aujourd'hui.", + "tokens": [ + 50376, + 6313, + 2788, + 408, + 725, + 37227, + 1736, + 1531, + 1769, + 421, + 6, + 266, + 5977, + 24689, + 317, + 347, + 1531, + 10695, + 5698, + 275, + 423, + 14023, + 6, + 10556, + 13, + 50606 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 
1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.735, + "words": [ + { + "text": "Mais", + "start": 137.32, + "end": 137.52, + "confidence": 0.984 + }, + { + "text": "ça", + "start": 137.52, + "end": 137.7, + "confidence": 0.877 + }, + { + "text": "ne", + "start": 137.7, + "end": 137.8, + "confidence": 0.672 + }, + { + "text": "ressemble", + "start": 137.8, + "end": 138.22, + "confidence": 0.731 + }, + { + "text": "pas", + "start": 138.22, + "end": 138.76, + "confidence": 0.526 + }, + { + "text": "à", + "start": 138.76, + "end": 138.94, + "confidence": 0.98 + }, + { + "text": "ce", + "start": 138.94, + "end": 139.08, + "confidence": 0.578 + }, + { + "text": "qu'on", + "start": 139.08, + "end": 139.22, + "confidence": 0.96 + }, + { + "text": "peut", + "start": 139.22, + "end": 139.38, + "confidence": 0.547 + }, + { + "text": "ressentir", + "start": 139.38, + "end": 140.06, + "confidence": 0.888 + }, + { + "text": "à", + "start": 140.06, + "end": 140.26, + "confidence": 0.437 + }, + { + "text": "voir", + "start": 140.26, + "end": 140.54, + "confidence": 0.952 + }, + { + "text": "même", + "start": 140.54, + "end": 140.96, + "confidence": 0.297 + }, + { + "text": "mome", + "start": 140.96, + "end": 141.22, + "confidence": 0.496 + }, + { + "text": "aujourd'hui.", + "start": 141.22, + "end": 141.84, + "confidence": 0.961 + } + ] + }, + { + "id": 42, + "seek": 13698, + "start": 141.96, + "end": 145.86, + "text": " Continuellement avec son smartphone dans la main, comme c'était une sorte de estimateur", + "tokens": [ + 50606, + 14674, + 31816, + 4163, + 1872, + 13307, + 2680, + 635, + 2135, + 11, + 5173, + 269, + 6, + 9743, + 2251, + 25559, + 368, + 8017, + 15540, + 50810 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.663, + "words": [ + { + "text": "Continuellement", + "start": 141.96, + "end": 142.84, + "confidence": 0.844 + 
}, + { + "text": "avec", + "start": 142.84, + "end": 143.24, + "confidence": 0.646 + }, + { + "text": "son", + "start": 143.24, + "end": 143.42, + "confidence": 0.864 + }, + { + "text": "smartphone", + "start": 143.42, + "end": 143.72, + "confidence": 0.447 + }, + { + "text": "dans", + "start": 143.72, + "end": 143.92, + "confidence": 0.587 + }, + { + "text": "la", + "start": 143.92, + "end": 144.0, + "confidence": 0.974 + }, + { + "text": "main,", + "start": 144.0, + "end": 144.3, + "confidence": 0.995 + }, + { + "text": "comme", + "start": 144.42, + "end": 144.56, + "confidence": 0.895 + }, + { + "text": "c'était", + "start": 144.56, + "end": 144.84, + "confidence": 0.596 + }, + { + "text": "une", + "start": 144.84, + "end": 144.96, + "confidence": 0.972 + }, + { + "text": "sorte", + "start": 144.96, + "end": 145.1, + "confidence": 0.658 + }, + { + "text": "de", + "start": 145.1, + "end": 145.4, + "confidence": 0.312 + }, + { + "text": "estimateur", + "start": 145.4, + "end": 145.86, + "confidence": 0.489 + } + ] + }, + { + "id": 43, + "seek": 13698, + "start": 145.96, + "end": 149.0, + "text": " extère de tomber de lâcher à l'éantrénée, ça m'a eu immédiate.", + "tokens": [ + 50810, + 1279, + 4212, + 368, + 2916, + 607, + 368, + 48835, + 6759, + 1531, + 287, + 6, + 526, + 394, + 81, + 3516, + 3856, + 11, + 2788, + 275, + 6, + 64, + 2228, + 3397, + 526, + 4504, + 473, + 13, + 50954 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.416, + "words": [ + { + "text": "extère", + "start": 145.96, + "end": 146.4, + "confidence": 0.371 + }, + { + "text": "de", + "start": 146.4, + "end": 146.54, + "confidence": 0.254 + }, + { + "text": "tomber", + "start": 146.54, + "end": 146.7, + "confidence": 0.102 + }, + { + "text": "de", + "start": 146.7, + "end": 146.9, + "confidence": 0.454 + }, + { + "text": "lâcher", + "start": 146.9, + "end": 147.34, + "confidence": 
0.75 + }, + { + "text": "à", + "start": 147.34, + "end": 147.46, + "confidence": 0.444 + }, + { + "text": "l'éantrénée,", + "start": 147.46, + "end": 147.9, + "confidence": 0.491 + }, + { + "text": "ça", + "start": 148.0, + "end": 148.02, + "confidence": 0.799 + }, + { + "text": "m'a", + "start": 148.02, + "end": 148.26, + "confidence": 0.531 + }, + { + "text": "eu", + "start": 148.26, + "end": 148.44, + "confidence": 0.136 + }, + { + "text": "immédiate.", + "start": 148.44, + "end": 149.0, + "confidence": 0.505 + } + ] + }, + { + "id": 44, + "seek": 13698, + "start": 149.08, + "end": 151.98, + "text": " Bon, je dis ça pour le mome, mais évidemment, va là, bon aussi.", + "tokens": [ + 50954, + 7368, + 11, + 1506, + 717, + 2788, + 2016, + 476, + 275, + 423, + 11, + 2420, + 24724, + 11, + 2773, + 3684, + 11, + 4428, + 6212, + 13, + 51126 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.564, + "words": [ + { + "text": "Bon,", + "start": 149.08, + "end": 149.28, + "confidence": 0.375 + }, + { + "text": "je", + "start": 149.34, + "end": 149.4, + "confidence": 0.471 + }, + { + "text": "dis", + "start": 149.4, + "end": 149.46, + "confidence": 0.324 + }, + { + "text": "ça", + "start": 149.46, + "end": 149.64, + "confidence": 0.952 + }, + { + "text": "pour", + "start": 149.64, + "end": 149.8, + "confidence": 0.963 + }, + { + "text": "le", + "start": 149.8, + "end": 149.92, + "confidence": 0.992 + }, + { + "text": "mome,", + "start": 149.92, + "end": 150.12, + "confidence": 0.619 + }, + { + "text": "mais", + "start": 150.46, + "end": 150.52, + "confidence": 0.694 + }, + { + "text": "évidemment,", + "start": 150.52, + "end": 151.12, + "confidence": 0.776 + }, + { + "text": "va", + "start": 151.26, + "end": 151.36, + "confidence": 0.388 + }, + { + "text": "là,", + "start": 151.36, + "end": 151.46, + "confidence": 0.59 + }, + { + "text": "bon", + "start": 151.6, 
+ "end": 151.68, + "confidence": 0.825 + }, + { + "text": "aussi.", + "start": 151.68, + "end": 151.98, + "confidence": 0.162 + } + ] + }, + { + "id": 45, + "seek": 13698, + "start": 152.64, + "end": 154.64, + "text": " Donc, rapport immédiate d'accord.", + "tokens": [ + 51126, + 7477, + 11, + 18018, + 3397, + 526, + 4504, + 473, + 274, + 6, + 19947, + 13, + 51248 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.861, + "words": [ + { + "text": "Donc,", + "start": 152.64, + "end": 153.08, + "confidence": 0.982 + }, + { + "text": "rapport", + "start": 153.16, + "end": 153.58, + "confidence": 0.979 + }, + { + "text": "immédiate", + "start": 153.58, + "end": 154.28, + "confidence": 0.841 + }, + { + "text": "d'accord.", + "start": 154.28, + "end": 154.64, + "confidence": 0.816 + } + ] + }, + { + "id": 46, + "seek": 13698, + "start": 155.66, + "end": 158.36, + "text": " Mais pourquoi, à ton impression qu'on en sortira, j'amé?", + "tokens": [ + 51248, + 6313, + 19934, + 11, + 1531, + 2952, + 9995, + 421, + 6, + 266, + 465, + 26906, + 64, + 11, + 361, + 6, + 335, + 526, + 30, + 51440 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.709, + "words": [ + { + "text": "Mais", + "start": 155.66, + "end": 155.88, + "confidence": 0.984 + }, + { + "text": "pourquoi,", + "start": 155.88, + "end": 156.28, + "confidence": 0.897 + }, + { + "text": "à", + "start": 156.38, + "end": 156.58, + "confidence": 0.837 + }, + { + "text": "ton", + "start": 156.58, + "end": 156.7, + "confidence": 0.953 + }, + { + "text": "impression", + "start": 156.7, + "end": 157.06, + "confidence": 0.938 + }, + { + "text": "qu'on", + "start": 157.06, + "end": 157.28, + "confidence": 0.89 + }, + { + "text": "en", + "start": 157.28, + "end": 157.4, + "confidence": 0.801 + }, + { + 
"text": "sortira,", + "start": 157.4, + "end": 157.88, + "confidence": 0.576 + }, + { + "text": "j'amé?", + "start": 157.96, + "end": 158.36, + "confidence": 0.464 + } + ] + }, + { + "id": 47, + "seek": 13698, + "start": 159.16, + "end": 163.32, + "text": " Et puis, il faut en remettre la faute sur les gens qui ont créé cette critique merveilleux", + "tokens": [ + 51440, + 3790, + 9093, + 11, + 1930, + 8487, + 465, + 890, + 40681, + 635, + 2050, + 1169, + 1022, + 1512, + 10668, + 1956, + 6592, + 15609, + 526, + 5550, + 25673, + 3551, + 303, + 3409, + 2449, + 51678 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.714, + "words": [ + { + "text": "Et", + "start": 159.16, + "end": 159.32, + "confidence": 0.832 + }, + { + "text": "puis,", + "start": 159.32, + "end": 159.46, + "confidence": 0.494 + }, + { + "text": "il", + "start": 159.62, + "end": 159.64, + "confidence": 0.594 + }, + { + "text": "faut", + "start": 159.64, + "end": 159.66, + "confidence": 0.951 + }, + { + "text": "en", + "start": 159.66, + "end": 159.78, + "confidence": 0.937 + }, + { + "text": "remettre", + "start": 159.78, + "end": 160.14, + "confidence": 0.984 + }, + { + "text": "la", + "start": 160.14, + "end": 160.42, + "confidence": 0.602 + }, + { + "text": "faute", + "start": 160.42, + "end": 160.68, + "confidence": 0.59 + }, + { + "text": "sur", + "start": 160.68, + "end": 160.98, + "confidence": 0.966 + }, + { + "text": "les", + "start": 160.98, + "end": 161.24, + "confidence": 0.828 + }, + { + "text": "gens", + "start": 161.24, + "end": 161.46, + "confidence": 0.986 + }, + { + "text": "qui", + "start": 161.46, + "end": 161.6, + "confidence": 0.98 + }, + { + "text": "ont", + "start": 161.6, + "end": 161.68, + "confidence": 0.95 + }, + { + "text": "créé", + "start": 161.68, + "end": 162.3, + "confidence": 0.95 + }, + { + "text": "cette", + "start": 162.3, + "end": 162.48, + 
"confidence": 0.908 + }, + { + "text": "critique", + "start": 162.48, + "end": 162.72, + "confidence": 0.032 + }, + { + "text": "merveilleux", + "start": 162.72, + "end": 163.32, + "confidence": 0.839 + } + ] + }, + { + "id": 48, + "seek": 13698, + "start": 163.32, + "end": 165.34, + "text": " et diabolique et diabolique par que merveilleux.", + "tokens": [ + 51678, + 1030, + 1026, + 14923, + 1925, + 1030, + 1026, + 14923, + 1925, + 971, + 631, + 3551, + 303, + 3409, + 2449, + 13, + 51778 + ], + "temperature": 0.0, + "avg_logprob": -0.5337450312471937, + "compression_ratio": 1.6231454005934718, + "no_speech_prob": 0.1096271350979805, + "confidence": 0.708, + "words": [ + { + "text": "et", + "start": 163.32, + "end": 163.44, + "confidence": 0.945 + }, + { + "text": "diabolique", + "start": 163.44, + "end": 163.86, + "confidence": 0.573 + }, + { + "text": "et", + "start": 163.86, + "end": 163.94, + "confidence": 0.238 + }, + { + "text": "diabolique", + "start": 163.94, + "end": 164.38, + "confidence": 0.892 + }, + { + "text": "par", + "start": 164.38, + "end": 164.62, + "confidence": 0.544 + }, + { + "text": "que", + "start": 164.62, + "end": 164.82, + "confidence": 0.529 + }, + { + "text": "merveilleux.", + "start": 164.82, + "end": 165.34, + "confidence": 0.981 + } + ] + }, + { + "id": 49, + "seek": 16526, + "start": 166.9, + "end": 168.8, + "text": " Les économistes parlent de dépendance du santé.", + "tokens": [ + 50410, + 6965, + 31171, + 22368, + 13734, + 317, + 368, + 45768, + 719, + 1581, + 30068, + 13, + 50542 + ], + "temperature": 0.0, + "avg_logprob": -0.6644235849380493, + "compression_ratio": 1.4761904761904763, + "no_speech_prob": 0.1915542334318161, + "confidence": 0.765, + "words": [ + { + "text": "Les", + "start": 166.9, + "end": 167.06, + "confidence": 0.699 + }, + { + "text": "économistes", + "start": 167.06, + "end": 167.52, + "confidence": 0.917 + }, + { + "text": "parlent", + "start": 167.52, + "end": 167.78, + "confidence": 0.793 + }, + { + 
"text": "de", + "start": 167.78, + "end": 167.84, + "confidence": 0.813 + }, + { + "text": "dépendance", + "start": 167.84, + "end": 168.36, + "confidence": 0.698 + }, + { + "text": "du", + "start": 168.36, + "end": 168.5, + "confidence": 0.963 + }, + { + "text": "santé.", + "start": 168.5, + "end": 168.8, + "confidence": 0.489 + } + ] + }, + { + "id": 50, + "seek": 16526, + "start": 168.82, + "end": 173.42, + "text": " Ces vidéos, en fait, on est un santé qui a été étabis, un soit mon termine, en marchand dessus,", + "tokens": [ + 50542, + 28414, + 25417, + 11, + 465, + 3887, + 11, + 322, + 871, + 517, + 30068, + 1956, + 257, + 8862, + 4823, + 455, + 271, + 11, + 517, + 12703, + 1108, + 1433, + 533, + 11, + 465, + 8368, + 474, + 30677, + 11, + 50784 + ], + "temperature": 0.0, + "avg_logprob": -0.6644235849380493, + "compression_ratio": 1.4761904761904763, + "no_speech_prob": 0.1915542334318161, + "confidence": 0.474, + "words": [ + { + "text": "Ces", + "start": 168.82, + "end": 169.14, + "confidence": 0.443 + }, + { + "text": "vidéos,", + "start": 169.14, + "end": 169.4, + "confidence": 0.455 + }, + { + "text": "en", + "start": 169.44, + "end": 169.64, + "confidence": 0.744 + }, + { + "text": "fait,", + "start": 169.64, + "end": 169.66, + "confidence": 0.976 + }, + { + "text": "on", + "start": 169.72, + "end": 169.74, + "confidence": 0.303 + }, + { + "text": "est", + "start": 169.74, + "end": 169.9, + "confidence": 0.814 + }, + { + "text": "un", + "start": 169.9, + "end": 170.48, + "confidence": 0.367 + }, + { + "text": "santé", + "start": 170.48, + "end": 170.8, + "confidence": 0.951 + }, + { + "text": "qui", + "start": 170.8, + "end": 170.92, + "confidence": 0.835 + }, + { + "text": "a", + "start": 170.92, + "end": 171.02, + "confidence": 0.819 + }, + { + "text": "été", + "start": 171.02, + "end": 171.12, + "confidence": 0.994 + }, + { + "text": "étabis,", + "start": 171.12, + "end": 171.5, + "confidence": 0.343 + }, + { + "text": "un", + "start": 171.76, + 
"end": 171.9, + "confidence": 0.236 + }, + { + "text": "soit", + "start": 171.9, + "end": 172.16, + "confidence": 0.31 + }, + { + "text": "mon", + "start": 172.16, + "end": 172.36, + "confidence": 0.205 + }, + { + "text": "termine,", + "start": 172.36, + "end": 172.72, + "confidence": 0.4 + }, + { + "text": "en", + "start": 172.8, + "end": 172.82, + "confidence": 0.309 + }, + { + "text": "marchand", + "start": 172.82, + "end": 173.14, + "confidence": 0.816 + }, + { + "text": "dessus,", + "start": 173.14, + "end": 173.42, + "confidence": 0.201 + } + ] + }, + { + "id": 51, + "seek": 16526, + "start": 173.86, + "end": 177.42, + "text": " soit des finissants débordes, des finissants, une signalétique.", + "tokens": [ + 50784, + 12703, + 730, + 962, + 891, + 1719, + 36529, + 765, + 279, + 11, + 730, + 962, + 891, + 1719, + 11, + 2251, + 6358, + 42379, + 13, + 50974 + ], + "temperature": 0.0, + "avg_logprob": -0.6644235849380493, + "compression_ratio": 1.4761904761904763, + "no_speech_prob": 0.1915542334318161, + "confidence": 0.582, + "words": [ + { + "text": "soit", + "start": 173.86, + "end": 174.4, + "confidence": 0.993 + }, + { + "text": "des", + "start": 174.4, + "end": 175.2, + "confidence": 0.759 + }, + { + "text": "finissants", + "start": 175.2, + "end": 175.58, + "confidence": 0.436 + }, + { + "text": "débordes,", + "start": 175.58, + "end": 175.98, + "confidence": 0.467 + }, + { + "text": "des", + "start": 176.14, + "end": 176.18, + "confidence": 0.222 + }, + { + "text": "finissants,", + "start": 176.18, + "end": 176.62, + "confidence": 0.961 + }, + { + "text": "une", + "start": 176.66, + "end": 176.84, + "confidence": 0.75 + }, + { + "text": "signalétique.", + "start": 176.84, + "end": 177.42, + "confidence": 0.566 + } + ] + } + ], + "language": "fr" +} \ No newline at end of file diff --git a/tests/expected/verbose.cpu/accurate.auto_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose.cpu/accurate.auto_bonjour_vous_allez_bien.mp3.stdout new file mode 
100644 index 0000000000000000000000000000000000000000..532d5eaf637389f5cfdbecc58823d2ccd29cfacb --- /dev/null +++ b/tests/expected/verbose.cpu/accurate.auto_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,11 @@ +[00:00.460 --> 00:00.780] Боже +[00:00.780 --> 00:01.980] улыл! +[00:02.020 --> 00:02.260] Таков +[00:02.260 --> 00:02.400] уже +[00:02.400 --> 00:02.460] на +[00:02.460 --> 00:02.800] меня! +[00:32.980 --> 00:33.280] Боже +[00:33.280 --> 00:33.800] улыл! +[00:34.400 --> 00:34.800] Эскому +[00:34.800 --> 00:34.960] за +[00:34.960 --> 00:35.260] меня! diff --git a/tests/expected/verbose.cpu/accurate.fr_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose.cpu/accurate.fr_bonjour_vous_allez_bien.mp3.stdout new file mode 100644 index 0000000000000000000000000000000000000000..bbe59141c7bb85cc4567ff0ac51949b691aea753 --- /dev/null +++ b/tests/expected/verbose.cpu/accurate.fr_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,13 @@ +[00:00.460 --> 00:00.680] Bonjour! +[00:01.860 --> 00:02.140] Est-ce +[00:02.140 --> 00:02.180] que +[00:02.180 --> 00:02.340] vous +[00:02.340 --> 00:02.480] allez +[00:02.480 --> 00:02.800] bien? +[00:32.980 --> 00:33.160] Bonjour! +[00:34.400 --> 00:34.610] Bonjour! +[00:34.610 --> 00:34.660] Est-ce +[00:34.660 --> 00:34.720] que +[00:34.720 --> 00:34.860] vous +[00:34.860 --> 00:35.000] allez +[00:35.000 --> 00:35.340] bien? diff --git a/tests/expected/verbose.cpu/efficient.auto_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose.cpu/efficient.auto_bonjour_vous_allez_bien.mp3.stdout new file mode 100644 index 0000000000000000000000000000000000000000..532d5eaf637389f5cfdbecc58823d2ccd29cfacb --- /dev/null +++ b/tests/expected/verbose.cpu/efficient.auto_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,11 @@ +[00:00.460 --> 00:00.780] Боже +[00:00.780 --> 00:01.980] улыл! +[00:02.020 --> 00:02.260] Таков +[00:02.260 --> 00:02.400] уже +[00:02.400 --> 00:02.460] на +[00:02.460 --> 00:02.800] меня! 
+[00:32.980 --> 00:33.280] Боже +[00:33.280 --> 00:33.800] улыл! +[00:34.400 --> 00:34.800] Эскому +[00:34.800 --> 00:34.960] за +[00:34.960 --> 00:35.260] меня! diff --git a/tests/expected/verbose.cpu/efficient.fr_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose.cpu/efficient.fr_bonjour_vous_allez_bien.mp3.stdout new file mode 100644 index 0000000000000000000000000000000000000000..bbe59141c7bb85cc4567ff0ac51949b691aea753 --- /dev/null +++ b/tests/expected/verbose.cpu/efficient.fr_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,13 @@ +[00:00.460 --> 00:00.680] Bonjour! +[00:01.860 --> 00:02.140] Est-ce +[00:02.140 --> 00:02.180] que +[00:02.180 --> 00:02.340] vous +[00:02.340 --> 00:02.480] allez +[00:02.480 --> 00:02.800] bien? +[00:32.980 --> 00:33.160] Bonjour! +[00:34.400 --> 00:34.610] Bonjour! +[00:34.610 --> 00:34.660] Est-ce +[00:34.660 --> 00:34.720] que +[00:34.720 --> 00:34.860] vous +[00:34.860 --> 00:35.000] allez +[00:35.000 --> 00:35.340] bien? diff --git a/tests/expected/verbose.cpu/hf_bonjour.wav.stdout b/tests/expected/verbose.cpu/hf_bonjour.wav.stdout new file mode 100644 index 0000000000000000000000000000000000000000..99635535fd87302067c97ce13d42f2988dacdd83 --- /dev/null +++ b/tests/expected/verbose.cpu/hf_bonjour.wav.stdout @@ -0,0 +1,3 @@ +Detecting language using up to the first 30 seconds. Use `--language` to specify the language +Detected language: French +[00:00.120 --> 00:00.640] Bonjour. diff --git a/tests/expected/verbose/accurate.auto_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose/accurate.auto_bonjour_vous_allez_bien.mp3.stdout new file mode 100644 index 0000000000000000000000000000000000000000..6bfee4b97e33192bc46f69994bddcd817c220226 --- /dev/null +++ b/tests/expected/verbose/accurate.auto_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,10 @@ +Detecting language using up to the first 30 seconds. 
Use `--language` to specify the language +Detected language: Russian +[00:00.440 --> 00:00.860] Боже +[00:00.860 --> 00:01.880] улыл! +[00:01.880 --> 00:02.300] Эскому +[00:02.300 --> 00:03.140] зарегиан! +[00:32.980 --> 00:33.360] Боже +[00:33.360 --> 00:34.020] улыл! +[00:34.420 --> 00:34.840] Эскому +[00:34.840 --> 00:35.720] зарегиан! diff --git a/tests/expected/verbose/accurate.fr_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose/accurate.fr_bonjour_vous_allez_bien.mp3.stdout new file mode 100644 index 0000000000000000000000000000000000000000..ec0d882ef119c14b9da62584ee57728eab7691fd --- /dev/null +++ b/tests/expected/verbose/accurate.fr_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,11 @@ +[00:00.440 --> 00:01.440] Bonjour ! +[00:01.880 --> 00:02.200] Est-ce +[00:02.200 --> 00:02.240] que +[00:02.240 --> 00:02.360] vous +[00:02.360 --> 00:02.560] allez +[00:02.560 --> 00:03.120] bien ? +[00:32.980 --> 00:33.480] Bonjour ! +[00:34.420 --> 00:34.760] Esque +[00:34.760 --> 00:34.900] vous +[00:34.900 --> 00:35.080] allez +[00:35.080 --> 00:35.480] bien ! diff --git a/tests/expected/verbose/efficient.auto_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose/efficient.auto_bonjour_vous_allez_bien.mp3.stdout new file mode 100644 index 0000000000000000000000000000000000000000..6bfee4b97e33192bc46f69994bddcd817c220226 --- /dev/null +++ b/tests/expected/verbose/efficient.auto_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,10 @@ +Detecting language using up to the first 30 seconds. Use `--language` to specify the language +Detected language: Russian +[00:00.440 --> 00:00.860] Боже +[00:00.860 --> 00:01.880] улыл! +[00:01.880 --> 00:02.300] Эскому +[00:02.300 --> 00:03.140] зарегиан! +[00:32.980 --> 00:33.360] Боже +[00:33.360 --> 00:34.020] улыл! +[00:34.420 --> 00:34.840] Эскому +[00:34.840 --> 00:35.720] зарегиан! 
diff --git a/tests/expected/verbose/efficient.fr_bonjour_vous_allez_bien.mp3.stdout b/tests/expected/verbose/efficient.fr_bonjour_vous_allez_bien.mp3.stdout new file mode 100644 index 0000000000000000000000000000000000000000..ec0d882ef119c14b9da62584ee57728eab7691fd --- /dev/null +++ b/tests/expected/verbose/efficient.fr_bonjour_vous_allez_bien.mp3.stdout @@ -0,0 +1,11 @@ +[00:00.440 --> 00:01.440] Bonjour ! +[00:01.880 --> 00:02.200] Est-ce +[00:02.200 --> 00:02.240] que +[00:02.240 --> 00:02.360] vous +[00:02.360 --> 00:02.560] allez +[00:02.560 --> 00:03.120] bien ? +[00:32.980 --> 00:33.480] Bonjour ! +[00:34.420 --> 00:34.760] Esque +[00:34.760 --> 00:34.900] vous +[00:34.900 --> 00:35.080] allez +[00:35.080 --> 00:35.480] bien ! diff --git a/tests/expected/verbose/hf_bonjour.wav.stdout b/tests/expected/verbose/hf_bonjour.wav.stdout new file mode 100644 index 0000000000000000000000000000000000000000..99635535fd87302067c97ce13d42f2988dacdd83 --- /dev/null +++ b/tests/expected/verbose/hf_bonjour.wav.stdout @@ -0,0 +1,3 @@ +Detecting language using up to the first 30 seconds. Use `--language` to specify the language +Detected language: French +[00:00.120 --> 00:00.640] Bonjour. diff --git a/tests/expected/verbose/vad_auditok_words.wav.stdout b/tests/expected/verbose/vad_auditok_words.wav.stdout new file mode 100644 index 0000000000000000000000000000000000000000..f0d2d990dc8c2da3adf9a47ec88b0fbfac0c7af1 --- /dev/null +++ b/tests/expected/verbose/vad_auditok_words.wav.stdout @@ -0,0 +1,8 @@ +[00:00.750 --> 00:01.470] settlement, +[00:02.950 --> 00:03.670] Kentucky, +[00:05.770 --> 00:06.290] causing +[00:07.900 --> 00:08.950] damage, +[00:10.900 --> 00:11.700] President, +[00:14.200 --> 00:14.780] expansion, +[00:17.120 --> 00:17.760] hospital, +[00:20.730 --> 00:21.330] devastated. 
diff --git a/tests/expected/verbose/vad_silero3.0_words.wav.stdout b/tests/expected/verbose/vad_silero3.0_words.wav.stdout new file mode 100644 index 0000000000000000000000000000000000000000..79e9f6107b1e48c0323c7fcfd843f9f3a9bf1be9 --- /dev/null +++ b/tests/expected/verbose/vad_silero3.0_words.wav.stdout @@ -0,0 +1,8 @@ +[00:00.760 --> 00:01.480] settlement, +[00:02.890 --> 00:03.670] Kentucky, +[00:05.710 --> 00:06.270] causing +[00:07.850 --> 00:08.930] damage, +[00:10.940 --> 00:11.700] president, +[00:14.200 --> 00:14.780] expansion, +[00:17.120 --> 00:17.780] hospital, +[00:20.140 --> 00:21.380] devastated. diff --git a/tests/expected/verbose/vad_silero3.1_words.wav.stdout b/tests/expected/verbose/vad_silero3.1_words.wav.stdout new file mode 100644 index 0000000000000000000000000000000000000000..54b0fd0716a5eed94c6a92c3ea372b879cec5401 --- /dev/null +++ b/tests/expected/verbose/vad_silero3.1_words.wav.stdout @@ -0,0 +1,8 @@ +[00:00.760 --> 00:01.480] settlement, +[00:02.920 --> 00:03.660] Kentucky, +[00:05.760 --> 00:06.260] causing +[00:07.850 --> 00:08.940] damage, +[00:10.840 --> 00:11.700] president, +[00:14.190 --> 00:14.770] expansion, +[00:17.130 --> 00:17.750] hospital, +[00:21.200 --> 00:21.380] devastated. diff --git a/tests/expected/verbose/vad_words.wav.stdout b/tests/expected/verbose/vad_words.wav.stdout new file mode 100644 index 0000000000000000000000000000000000000000..5dbf58fc48651f530a5a99a116062ab15fe66aeb --- /dev/null +++ b/tests/expected/verbose/vad_words.wav.stdout @@ -0,0 +1,8 @@ +[00:00.760 --> 00:01.460] settlement, +[00:02.900 --> 00:03.680] Kentucky, +[00:05.710 --> 00:06.270] causing +[00:07.890 --> 00:08.940] damage, +[00:10.930 --> 00:11.690] president, +[00:14.070 --> 00:14.770] expansion, +[00:17.140 --> 00:17.780] hospital, +[00:20.730 --> 00:21.370] devastated. 
diff --git a/tests/json_schema.json b/tests/json_schema.json new file mode 100644 index 0000000000000000000000000000000000000000..63dfcc6e7ac6247c85d515442d144d744109fc12 --- /dev/null +++ b/tests/json_schema.json @@ -0,0 +1,41 @@ +{ + "type": "object", + "properties": { + "text": {"type": "string"}, + "segments": { + "type": "array", + "items": { + "type": "object", + "properties": { + "id": {"type": "integer", "minimum":0}, + "start": {"type": "number", "minimum":0}, + "end": {"type": "number", "minimum":0}, + "text": {"type": "string"}, + "tokens": { + "type": "array", + "items": {"type": "integer", "minimum": 0, "maximum": 51864} + }, + "temperature": {"type": "number", "minimum":0, "maximum":1}, + "avg_logprob": {"type": "number", "maximum":0}, + "compression_ratio": {"type": "number", "minimum":0}, + "no_speech_prob": {"type": "number", "minimum":0, "maximum":1}, + "confidence": {"type": "number", "minimum":0, "maximum":1}, + "words": { + "type": "array", + "items": { + "type": "object", + "properties": { + "text": {"type": "string"}, + "start": {"type": "number", "minimum":0}, + "end": {"type": "number", "minimum":0}, + "confidence": {"type": "number", "minimum":0, "maximum":1} + } + } + } + } + }, + "minItems": 0, + "uniqueItems": true + } + } +} diff --git a/tests/run_tests.py b/tests/run_tests.py new file mode 100644 index 0000000000000000000000000000000000000000..0b202b69af065c478fc99607b012ccec40cf5580 --- /dev/null +++ b/tests/run_tests.py @@ -0,0 +1,48 @@ +import sys +import unittest + +from test_transcribe import * +import test_transcribe + +if __name__ == '__main__': + + # Handle several ways of generating expected outputs + if "--long" in sys.argv: + test_transcribe.SKIP_LONG_TEST_IF_CPU = False + sys.argv.remove("--long") + if "--generate" in sys.argv: + test_transcribe.FAIL_IF_REFERENCE_NOT_FOUND = False + sys.argv.remove("--generate") + if "--generate_device" in sys.argv: + test_transcribe.GENERATE_DEVICE_DEPENDENT = True + 
class TestHelper(unittest.TestCase):
    """Shared helpers for the non-regression tests.

    Provides path resolution inside the repository, a subprocess runner, and
    comparison of generated outputs against stored reference files (with the
    ability to create missing references, depending on the module-level
    generation flags).
    """

    def skipLongTests(self):
        """Return True when long tests are disabled and no CUDA device is available."""
        return SKIP_LONG_TEST_IF_CPU and not torch.cuda.is_available()

    def setUp(self):
        self.maxDiff = None
        # References created by assertNonRegression during the current test
        self.createdReferences = []

    def tearDown(self):
        """Report created references: a warning in generation modes, a failure otherwise."""
        created = ", ".join(self.createdReferences).replace(self.get_data_path()+"/", "")
        if GENERATE_ALL or GENERATE_NEW_ONLY or not FAIL_IF_REFERENCE_NOT_FOUND or GENERATE_DEVICE_DEPENDENT:
            if self.createdReferences:
                print("WARNING: Created references: " + created)
        else:
            self.assertEqual(self.createdReferences, [], "Created references: " + created)

    def get_main_path(self, fn=None, check=False):
        """Return the path of `fn` inside the "whisper_timestamped" folder."""
        return self._get_path("whisper_timestamped", fn, check=check)

    def get_output_path(self, fn=None):
        """Return the temporary directory, or `fn` (suffixed with the extra CLI options) inside it."""
        if fn is None:
            return tempfile.gettempdir()
        return os.path.join(tempfile.gettempdir(), fn + self._extra_cmd_options())

    def get_expected_path(self, fn=None, check=False):
        """Return the path of `fn` inside the folder of expected (reference) outputs."""
        return self._get_path("tests/expected" + self._extra_cmd_options(), fn, check=check)

    def _extra_cmd_options(self):
        """Return a suffix (".<options>") built from CMD_OPTIONS, or "" when there is none."""
        s = "".join(f.replace("-", "").strip() for f in CMD_OPTIONS)
        return "." + s if s else ""

    def get_data_files(self, files=None, excluded_by_default=("apollo11.mp3", "music.mp4", "arabic.mp3", "japanese.mp3", "empty.wav", "words.wav")):
        """Return the full paths of the input data files.

        When `files` is None, all files of the data folder are listed (sorted),
        except those in `excluded_by_default` and those ending with "json".
        When `files` is given, it is used as is (no filtering, no sorting).
        """
        if files is None:
            files = sorted(
                f for f in os.listdir(self.get_data_path())
                if f not in excluded_by_default and not f.endswith("json")
            )
        return [self.get_data_path(fn) for fn in files]

    def get_generated_files(self, input_filename, output_path, extensions):
        """Yield "<output_path>/<basename of input>.<ext>" for each extension."""
        for ext in extensions:
            yield os.path.join(output_path, os.path.basename(input_filename) + "." + ext.lstrip("."))

    def main_script(self, pyscript = "transcribe.py", exename = "whisper_timestamped"):
        """Return the path of the python script if it exists, the executable name otherwise."""
        main_script = self.get_main_path(pyscript, check=False)
        if not os.path.exists(main_script):
            main_script = exename
        return main_script

    def assertRun(self, cmd):
        """Run a command from the temporary directory and assert that it exits with code 0.

        `cmd` is a list of arguments, or a string that is split on whitespace.
        A first argument ending with ".py" is run with the current interpreter.
        Returns the decoded (stdout, stderr) pair.
        """
        if isinstance(cmd, str):
            return self.assertRun(cmd.split())
        if cmd[0].endswith(".py"):
            cmd = [sys.executable] + cmd
        print("Running:", " ".join(cmd))
        p = subprocess.Popen(
            cmd,
            # Only the child runs in the temporary directory: the working
            # directory of the test process is never changed, so there is
            # nothing to restore if the command cannot be launched
            cwd=tempfile.gettempdir(),
            # Otherwise ".local" path might be missing
            env=dict(os.environ, PYTHONPATH=os.pathsep.join(sys.path)),
            stdout=subprocess.PIPE, stderr=subprocess.PIPE,
        )
        (stdout, stderr) = p.communicate()
        self.assertEqual(p.returncode, 0, msg=stderr.decode("utf-8"))
        return (stdout.decode("utf-8"), stderr.decode("utf-8"))

    def assertNonRegression(self, content, reference, string_is_file=True):
        """
        Check that a file/folder is the same as a reference file/folder.

        content: a dictionary (dumped as JSON), a path to a file/folder,
            or a raw string when `string_is_file` is False.
        reference: name of the reference, relative to the expected folder.
            A missing reference is created from `content` (and recorded in
            `self.createdReferences`).
        """
        if isinstance(content, dict):
            # Make a temporary file
            with tempfile.NamedTemporaryFile(mode="w", suffix=".json", encoding="utf8", delete=False) as f:
                json.dump(content, f, indent=2, ensure_ascii=False)
            try:
                return self.assertNonRegression(f.name, reference)
            finally:
                # Remove the temporary file even when the comparison fails
                os.remove(f.name)
        elif not isinstance(content, str):
            raise ValueError(f"Invalid content type: {type(content)}")

        if not string_is_file:
            with tempfile.NamedTemporaryFile(mode="w", suffix=".txt", encoding="utf8", delete=False) as f:
                f.write(content)
            try:
                return self.assertNonRegression(f.name, reference)
            finally:
                os.remove(f.name)

        self.assertTrue(os.path.exists(content), f"Missing file: {content}")
        # NOTE(review): `reference` is tested here before being resolved into the
        # expected folder, i.e. relatively to the current directory -- confirm this is intended
        is_file = os.path.isfile(reference) if os.path.exists(reference) else os.path.isfile(content)

        reference = self.get_expected_path(
            reference, check=FAIL_IF_REFERENCE_NOT_FOUND)
        if not os.path.exists(reference) or ((GENERATE_ALL or GENERATE_DEVICE_DEPENDENT) and reference not in self.createdReferences):
            dirname = os.path.dirname(reference)
            if not os.path.isdir(dirname):
                os.makedirs(dirname)
            if is_file:
                shutil.copyfile(content, reference)
            else:
                shutil.copytree(content, reference)
            self.createdReferences.append(reference)

        if is_file:
            self.assertTrue(os.path.isfile(content))
            self._check_file_non_regression(content, reference)
        else:
            self.assertTrue(os.path.isdir(content))
            for root, dirs, files in os.walk(content):
                for f in files:
                    f_ref = os.path.join(reference, f)
                    self.assertTrue(os.path.isfile(f_ref),
                                    f"Additional file: {f}")
                    self._check_file_non_regression(
                        os.path.join(root, f), f_ref)
            for root, dirs, files in os.walk(reference):
                for f in files:
                    f = os.path.join(content, f)
                    self.assertTrue(os.path.isfile(f), f"Missing file: {f}")

    def get_data_path(self, fn=None, check=True):
        """Return the path of `fn` inside the folder of test data."""
        return self._get_path("tests/data", fn, check)

    def _get_path(self, prefix, fn=None, check=True):
        """Return `prefix` (and `fn`, if given) under the parent of this file's folder.

        When `check` is True, the test fails if the path does not exist.
        """
        path = os.path.join(
            os.path.dirname(os.path.dirname(__file__)),
            prefix
        )
        if fn:
            path = os.path.join(path, fn)
        if check:
            self.assertTrue(os.path.exists(path), f"Cannot find {path}")
        return path

    def _check_file_non_regression(self, file, reference):
        """Compare a file with its reference: loosely for JSON files, line by line otherwise."""
        # Temporary JSON files are written as UTF-8 by assertNonRegression: read with the same encoding
        if file.endswith(".json"):
            with open(file, encoding="utf-8") as f:
                content = json.load(f)
            with open(reference, encoding="utf-8") as f:
                reference_content = json.load(f)
            if "language" in content and "language" in reference_content:
                content["language"] = self.norm_language(content["language"])
                reference_content["language"] = self.norm_language(reference_content["language"])
            self.assertClose(content, reference_content,
                             msg=f"File {file} does not match reference {reference}")
            return
        with open(file, encoding="utf-8") as f:
            content = f.readlines()
        with open(reference, encoding="utf-8") as f:
            reference_content = f.readlines()
        self.assertEqual(content, reference_content,
                         msg=f"File {file} does not match reference {reference}")

    def assertClose(self, obj1, obj2, msg=None):
        """Assert that two objects are equal once their floats are rounded (see `loose`)."""
        return self.assertEqual(self.loose(obj1), self.loose(obj2), msg=msg)

    def loose(self, obj):
        """Return an approximative value of an object.

        Floats are rounded to one decimal (negative zero becomes 0.0);
        lists, tuples, sets and dictionary values are processed recursively;
        any other object is returned unchanged.
        """
        if isinstance(obj, list):
            return [self.loose(a) for a in obj]
        if isinstance(obj, float):
            f = round(obj, 1)
            return 0.0 if f == -0.0 else f
        if isinstance(obj, dict):
            return {k: self.loose(v) for k, v in obj.items()}
        if isinstance(obj, tuple):
            return tuple(self.loose(list(obj)))
        if isinstance(obj, set):
            return {self.loose(a) for a in obj}
        return obj

    def get_audio_duration(self, audio_file):
        """Return the duration of an audio file, in seconds."""
        # Get the duration in sec *without introducing additional dependencies*
        import whisper
        return len(whisper.load_audio(audio_file)) / whisper.audio.SAMPLE_RATE

    def get_device_str(self):
        """Return "cuda" if a CUDA device is available, "cpu" otherwise."""
        import torch
        return "cpu" if not torch.cuda.is_available() else "cuda"

    def norm_language(self, language):
        """Map known language names to their code ("japanese" -> "ja"); other values are returned as is."""
        # Cheap custom stuff to avoid importing everything
        return {
            "japanese": "ja",
        }.get(language.lower(), language)
class TestHelperCli(TestHelper):
    """Helpers to run the command line and compare its outputs with references."""

    # JSON schema of the ".words.json" outputs, loaded once and shared by all tests
    json_schema = None

    def _test_cli_(self, opts, name, files=None, extensions=("words.json",), prefix=None, one_per_call=True, device_specific=None):
        """
        Test command line
        opts: list of options
        name: name of the test
        files: list of files to process
        extensions: list of extensions to check, or None to test the stdout
        prefix: prefix to add to the reference files
        one_per_call: if True, each file is processed separately, otherwise all files are processed by a single process
        device_specific: whether references depend on the device (None to decide from the audio duration and test name)
        """

        opts = opts + CMD_OPTIONS

        output_dir = self.get_output_path(name)

        input_filenames = self.get_data_files(files)

        # When the stdout is tested, the reference is a single ".stdout" file
        reference_extensions = ["stdout"] if extensions is None else extensions

        # Whether the command processing all files at once has been run already
        batch_done = False

        for input_filename in input_filenames:

            # Butterfly effect: Results are different depending on the device for long files
            duration = self.get_audio_duration(input_filename)
            if device_specific is None:
                device_dependent = duration > 60 or (duration > 30 and "tiny_fr" in name) or ("empty" in input_filename and "medium_auto" in name)
            else:
                device_dependent = device_specific
            name_ = name
            if device_dependent and self.get_device_str() != "cuda":
                name_ += f".{self.get_device_str()}"

            def ref_name(output_filename):
                return name_ + "/" + (f"{prefix}_" if prefix else "") + os.path.basename(output_filename)
            generic_name = ref_name(input_filename + ".*")

            if GENERATE_DEVICE_DEPENDENT and not device_dependent:
                print("Skipping non-regression test", generic_name)
                continue

            if GENERATE_NEW_ONLY and all(
                os.path.exists(self.get_expected_path(ref_name(output_filename)))
                for output_filename in self.get_generated_files(input_filename, output_dir, extensions=reference_extensions)
            ):
                print("Skipping non-regression test", generic_name)
                continue

            print("Running non-regression test", generic_name)

            if one_per_call:
                (stdout, stderr) = self.assertRun([self.main_script(), input_filename, "--output_dir", output_dir, *opts])
                print(stdout)
                print(stderr)
            elif not batch_done:
                # Run once for all files, on the first file that is not skipped
                (stdout, stderr) = self.assertRun([self.main_script(), *input_filenames, "--output_dir", output_dir, *opts])
                batch_done = True
                print(stdout)
                print(stderr)

            output_json = next(self.get_generated_files(input_filename, output_dir, extensions=["words.json"]))
            if os.path.isfile(output_json):
                self.check_json(output_json)

            if extensions is None:
                output_filename = next(self.get_generated_files(input_filename, output_dir, extensions=["stdout"]))
                self.assertNonRegression(stdout, ref_name(output_filename), string_is_file=False)
            else:
                for output_filename in self.get_generated_files(input_filename, output_dir, extensions=extensions):
                    self.assertNonRegression(output_filename, ref_name(output_filename))

        shutil.rmtree(output_dir, ignore_errors=True)

    def check_json(self, json_file):
        """Validate a JSON file against the schema "json_schema.json" located next to this file."""
        with open(json_file, encoding="utf-8") as f:
            content = json.load(f)

        if TestHelperCli.json_schema is None:
            schema_file = os.path.join(os.path.dirname(__file__), "json_schema.json")
            self.assertTrue(os.path.isfile(schema_file), msg=f"Schema file {schema_file} not found")
            with open(schema_file, encoding="utf-8") as f:
                # Stored on the class: a new instance is created for each test
                TestHelperCli.json_schema = json.load(f)

        jsonschema.validate(instance=content, schema=TestHelperCli.json_schema)
class TestTranscribeCornerCases(TestHelperCli):
    """Non-regression tests on inputs / options that used to cause troubles."""

    def test_stucked_lm(self):
        if not self.skipLongTests():
            self._test_cli_(
                ["--model", "small", "--language", "en", "--efficient"],
                "corner_cases",
                files=["apollo11.mp3"],
                prefix="stucked_lm",
            )

    def test_punctuation_only(self):
        # When there is only a punctuation detected in a segment, it could cause issue #24
        options = ["--model", "medium.en", "--efficient", "--punctuations", "False"]
        self._test_cli_(options, "corner_cases", files=["empty.wav"], prefix="issue24")

    def test_temperature(self):
        audio = ["apollo11.mp3"]

        # Always run: random decoding, not conditioned on previous text
        self._test_cli_(
            ["--model", "small", "--language", "English",
             "--condition", "False", "--temperature", "0.1", "--efficient"],
            "corner_cases",
            files=audio,
            prefix="random.nocond",
        )

        # Only run when long tests are enabled
        if not self.skipLongTests():
            self._test_cli_(
                ["--model", "small", "--language", "en", "--temperature", "0.2", "--efficient"],
                "corner_cases",
                files=audio,
                prefix="random",
            )

    def test_not_conditioned(self):
        # The audio file is optional, and the test is long
        if not os.path.exists(self.get_data_path("music.mp4", check=False)) or self.skipLongTests():
            return

        common = ["--model", "medium", "--language", "en", "--condition", "False"]

        self._test_cli_(
            common + ["--efficient"],
            "corner_cases",
            files=["music.mp4"],
            prefix="nocond",
        )

        self._test_cli_(
            common + ["--temperature", "0.4", "--efficient"],
            "corner_cases",
            files=["music.mp4"],
            prefix="nocond.random",
        )

    def test_large(self):
        if self.skipLongTests():
            return

        self._test_cli_(
            ["--model", "large-v2", "--language", "en",
             "--condition", "False", "--temperature", "0.4", "--efficient"],
            "corner_cases",
            files=["apollo11.mp3"],
            prefix="large",
        )

        # The arabic audio file is optional
        if not os.path.exists(self.get_data_path("arabic.mp3", check=False)):
            return
        self._test_cli_(
            ["--model", "large-v2", "--language", "Arabic", "--efficient"],
            "corner_cases",
            files=["arabic.mp3"]
        )

    def test_gloria(self):
        # All combinations of model and decoding strategy
        combinations = [
            (model, dec)
            for model in ("medium", "large-v2")
            for dec in ("efficient", "accurate")
        ]
        for model, dec in combinations:
            self._test_cli_(
                ["--model", model, "--language", "en", f"--{dec}"],
                "corner_cases",
                files=["gloria.mp3"],
                prefix=f"{model}.{dec}",
            )
"tiny", "--language", "en", "--vad", "auditok", "--verbose", "True"], + "verbose", + files=["words.wav"], + prefix="vad_auditok", + extensions=None, + ) + + +class TestTranscribeUnspacedLanguage(TestHelperCli): + + def test_japanese(self): + + self._test_cli_( + ["--model", "tiny", "--efficient"], + "tiny_auto", + files=["japanese.mp3"], + device_specific=True, + ) + + self._test_cli_( + ["--model", "tiny", "--language", "Japanese", "--efficient"], + "tiny_auto", + files=["japanese.mp3"], + prefix="jp", + device_specific=True, + ) + + self._test_cli_( + ["--model", "tiny", "--accurate"], + "tiny_auto", + files=["japanese.mp3"], + prefix="accurate", + device_specific=True, + ) + + self._test_cli_( + ["--model", "tiny", "--language", "Japanese", "--accurate"], + "tiny_auto", + files=["japanese.mp3"], + prefix="accurate_jp", + device_specific=True, + ) + +class TestTranscribeFormats(TestHelperCli): + + def test_cli_outputs(self): + files = ["punctuations.mp3", "bonjour.wav"] + extensions = ["txt", "srt", "vtt", "words.srt", "words.vtt", + "words.json", "csv", "words.csv", "tsv", "words.tsv"] + opts = ["--model", "medium", "--language", "fr"] + + # An audio / model combination that produces coma + self._test_cli_( + opts, + "punctuations_yes", + files=files, + extensions=extensions, + one_per_call=False, + ) + self._test_cli_( + opts + ["--punctuations", "False"], + "punctuations_no", + files=files, + extensions=extensions, + one_per_call=False, + ) + + def test_verbose(self): + + files = ["bonjour_vous_allez_bien.mp3"] + opts = ["--model", "tiny", "--verbose", "True"] + + self._test_cli_( + ["--efficient", *opts], + "verbose", files=files, extensions=None, + prefix="efficient.auto", + device_specific=True, + ) + + self._test_cli_( + ["--language", "fr", "--efficient", *opts], + "verbose", files=files, extensions=None, + prefix="efficient.fr", + device_specific=True, + ) + + self._test_cli_( + opts, + "verbose", files=files, extensions=None, + prefix="accurate.auto", + 
class TestMakeSubtitles(TestHelper):
    """Non-regression tests of the script that converts ".words.json" files into subtitles."""

    def test_make_subtitles(self):

        script = self.main_script("make_subtitles.py", "whisper_timestamped_make_subtitles")

        json_paths = [
            self.get_data_path("smartphone.mp3.words.json"),
            self.get_data_path("no_punctuations.mp3.words.json", check=True),
            self.get_data_path("yes_punctuations.mp3.words.json", check=True),
        ]

        for index, json_path in enumerate(json_paths):
            stem = os.path.basename(json_path).replace(".words.json", "")
            for max_length in (6, 20, 50):
                output_dir = self.get_output_path()

                # First input: process the whole data folder. Others: process the file alone
                source = json_path if index > 0 else self.get_data_path()
                self.assertRun([script, source, output_dir, "--max_length", str(max_length)])

                for extension in ("vtt", "srt"):
                    output_file = os.path.join(output_dir, f"{stem}.{extension}")
                    expected_file = f"split_subtitles/{stem.split('_')[-1]}_{max_length}.{extension}"

                    # Output written in a folder
                    self.assertTrue(os.path.isfile(output_file), msg=f"File {output_file} not found")
                    self.assertNonRegression(output_file, expected_file)
                    os.remove(output_file)

                    # Same output, when an explicit output file is given
                    self.assertRun([script, json_path, output_file, "--max_length", str(max_length)])
                    self.assertTrue(os.path.isfile(output_file), msg=f"File {output_file} not found")
                    self.assertNonRegression(output_file, expected_file)
whisper_timestamped + + # Test version + version = whisper_timestamped.__version__ + self.assertTrue(isinstance(version, str)) + + (stdout, sterr) = self.assertRun([self.main_script(), "-v"]) + self.assertEqual(stdout.strip(), version) + + model = whisper_timestamped.load_model("tiny") + + # Check processing of different files + for filename in "bonjour.wav", "laugh1.mp3", "laugh2.mp3": + res = whisper_timestamped.transcribe( + model, self.get_data_path(filename)) + if self._can_generate_reference(): + self.assertNonRegression(res, f"tiny_auto/{filename}.words.json") + + for filename in "bonjour.wav", "laugh1.mp3", "laugh2.mp3": + res = whisper_timestamped.transcribe( + model, self.get_data_path(filename), language="fr") + if self._can_generate_reference(): + self.assertNonRegression(res, f"tiny_fr/{filename}.words.json") + + def _can_generate_reference(self): + return not GENERATE_DEVICE_DEPENDENT or self.get_device_str() != "cpu" + + def test_split_tokens(self): + + import whisper + whisperversion = whisper.__version__ + + import whisper_timestamped as whisper + from whisper_timestamped.transcribe import split_tokens_on_spaces + + tokenizer = whisper.tokenizer.get_tokenizer(True, language=None) + + # 220 means space + tokens = [50364, 220, 6455, 11, 2232, 11, 286, 2041, 11, 2232, 11, 8660, + 291, 808, 493, 220, 365, 11, 220, 445, 718, 505, 458, 13, 220, 50714] + + self.assertEqual( + split_tokens_on_spaces(tokens, tokenizer), + (['<|0.00|>', 'So,', 'uh,', 'I', 'guess,', 'uh,', 'wherever', 'you', 'come', 'up', 'with,', 'just', 'let', 'us', 'know.', '<|7.00|>'], + [['<|0.00|>'], + [' ', 'So', ','], + [' uh', ','], + [' I'], + [' guess', ','], + [' uh', ','], + [' wherever'], + [' you'], + [' come'], + [' up'], + [' ', ' with', ','], + [' ', ' just'], + [' let'], + [' us'], + [' know', '.', ' '], + ['<|7.00|>']], + [[50364], + [220, 6455, 11], + [2232, 11], + [286], + [2041, 11], + [2232, 11], + [8660], + [291], + [808], + [493], + [220, 365, 11], + [220, 445], + 
[718], + [505], + [458, 13, 220], + [50714] + ]) + ) + + tokens = [50366, 314, 6, 11771, 17134, 11, 4666, 11, 1022, 220, 875, 2557, 68, 11, 6992, 631, 269, 6, 377, 220, 409, 7282, 1956, 871, 566, 2707, 394, 1956, 256, 622, 8208, 631, 8208, 871, 517, 7282, 1956, 5977, 7418, 371, 1004, 306, 580, 11, 5977, 12, 9498, 9505, 84, 6, 50416] + self.assertEqual( + split_tokens_on_spaces(tokens, tokenizer), + ( + ['<|0.04|>', "T'façon,", 'nous,', 'sur', 'la', 'touche,', 'parce', 'que', "c'est", 'un', 'sport', 'qui', 'est', 'important', 'qui', 'tue', 'deux', 'que', 'deux', 'est', 'un', 'sport', 'qui', 'peut', 'être', 'violent,', 'peut-être', "qu'", '<|1.04|>'], + [['<|0.04|>'], + [' T', "'", 'fa', 'çon', ','], + [' nous', ','], + [' sur'], + [' ', 'la'], + [' touch', 'e', ','], + [' parce'], + [' que'], + [' c', "'", 'est'], + [' ', 'un'], + [' sport'], + [' qui'], + [' est'], + [' im', 'port', 'ant'], + [' qui'], + [' t', 'ue'], + [' deux'], + [' que'], + [' deux'], + [' est'], + [' un'], + [' sport'], + [' qui'], + [' peut'], + [' être'], + [' v', 'io', 'le', 'nt', ','], + [' peut', '-', 'être'], + [' q', 'u', "'"], + ['<|1.04|>']], + [[50366], + [314, 6, 11771, 17134, 11], + [4666, 11], + [1022], + [220, 875], + [2557, 68, 11], + [6992], + [631], + [269, 6, 377], + [220, 409], + [7282], + [1956], + [871], + [566, 2707, 394], + [1956], + [256, 622], + [8208], + [631], + [8208], + [871], + [517], + [7282], + [1956], + [5977], + [7418], + [371, 1004, 306, 580, 11], + [5977, 12, 9498], + [9505, 84, 6], + [50416]] + ) + ) + + tokens = [50364, 220, 220, 6455, 11, 220, 220, 2232, 220, 220, 11, 220, 50714] + self.assertEqual( + split_tokens_on_spaces(tokens, tokenizer), + (['<|0.00|>', 'So,', 'uh', ',', '<|7.00|>'], + [['<|0.00|>'], + [' ', ' ', 'So', ','], + [' ', ' ', ' uh'], + [' ', ' ', ',', ' '], + ['<|7.00|>']], + [[50364], [220, 220, 6455, 11], [220, 220, 2232], [220, 220, 11, 220], [50714]] + ) + ) + + # Careful with the double spaces at the end... 
+ tokens = [50364, 220, 220, 6455, 11, 220, 220, 2232, 220, 220, 11, 220, 220, 50714] + self.assertEqual( + split_tokens_on_spaces(tokens, tokenizer), + (['<|0.00|>', 'So,', 'uh', ',', '', '<|7.00|>'], + [['<|0.00|>'], + [' ', ' ', 'So', ','], + [' ', ' ', ' uh'], + [' ', ' ', ','], + [' ', ' '], + ['<|7.00|>']], + [[50364], [220, 220, 6455, 11], [220, 220, 2232], [220, 220, 11], [220, 220], [50714]] + ) + ) + + # Tokens that could be removed + tokens = [50364, 6024, 95, 8848, 7649, 8717, 38251, 11703, 3224, 51864] + self.assertEqual( + split_tokens_on_spaces(tokens, tokenizer), + (['<|0.00|>', 'الآذان', 'نسمّه', '<|30.00|>'], + [['<|0.00|>'], ['', ' الآ', 'ذ', 'ان'], [' ن', 'سم', 'ّ', 'ه'], ['<|30.00|>']], + [[50364], [6024, 95, 8848, 7649], [8717, 38251, 11703, 3224], [51864]] + ) + ) + + # issue #61 + # Special tokens that are not timestamps + tokens = [50414, 805, 12, 17, 50299, 11, 568, 12, 18, 12, 21, 11, 502, 12, 17, 12, 51464] + # 50299 is "<|te|>" and appears as "" + te = "" + self.assertEqual( + split_tokens_on_spaces(tokens, tokenizer), + (['<|1.00|>', f'3-2{te},', '2-3-6,', '1-2-', '<|22.00|>'], + [['<|1.00|>'], [' 3', '-', '2', f'{te}', ','], [' 2', '-', '3', '-','6', ','], [' 1', '-', '2', '-'], ['<|22.00|>']], + [[50414], [805, 12, 17, 50299, 11], [568, 12, 18, 12, 21, 11], [502, 12, 17, 12], [51464]]) + ) + + tokenizer = whisper.tokenizer.get_tokenizer(False, language="en") + + # Just a punctuation character + tokens = [50363, 764, 51813] + + _dot = "." if whisperversion < "20230314" else " ." 
# Characters after which a segment can be cut ("-" and "'" are excluded from ASCII punctuation)
_punctuation = "".join(c for c in string.punctuation if c not in ["-", "'"]) + "。,!?:”、…"

def split_long_segments(segments, max_length, use_space = True):
    """
    Split segments whose text is longer than `max_length` characters.

    segments: list of dictionaries with keys "text", "start", "end",
        and "words" (list of dictionaries with keys "text", "start", "end") for long segments
    max_length: maximum number of characters of a segment
    use_space: whether words are separated by a space

    Returns a new list of segments. Short segments are kept as they are.
    Long segments are replaced by dictionaries with keys "text", "start" and "end",
    cut after the last punctuation mark when there is one, before the overflowing word otherwise.
    """
    # Number of characters between the end of a word and the start of the next one
    separator_length = 1 if use_space else 0

    new_segments = []
    for segment in segments:
        text = segment["text"]
        if len(text) <= max_length:
            new_segments.append(segment)
            continue

        meta_words = segment["words"]
        # Note: we do this in case punctuation were removed from words
        if use_space:
            # Split text around spaces and punctuations (keeping punctuations)
            words = text.split()
        else:
            words = [w["text"] for w in meta_words]
        if len(words) != len(meta_words):
            new_words = [w["text"] for w in meta_words]
            print(f"WARNING: {' '.join(words)} != {' '.join(new_words)}")
            words = new_words

        current_text = ""
        current_start = segment["start"]
        # Best place to cut so far: index in current_text (just after a punctuation mark),
        # with the end time of the part before and the start time of the part after
        current_best_idx = None
        current_best_end = None
        current_best_next_start = None
        for i, (word, meta) in enumerate(zip(words, meta_words)):
            current_text_before = current_text
            if current_text and use_space:
                current_text += " "
            current_text += word

            if len(current_text) > max_length and current_text_before:
                start = current_start
                if current_best_idx is not None:
                    text = current_text[:current_best_idx]
                    end = current_best_end
                    # Skip the separator, if any (there is none to skip without spaces)
                    current_text = current_text[current_best_idx+separator_length:]
                    current_start = current_best_next_start
                else:
                    text = current_text_before
                    end = meta_words[i-1]["end"]
                    current_text = word
                    current_start = meta["start"]

                current_best_idx = None
                current_best_end = None
                current_best_next_start = None

                new_segments.append({"text": text, "start": start, "end": end})

            # Try to cut after punctuation
            if current_text and current_text[-1] in _punctuation:
                current_best_idx = len(current_text)
                current_best_end = meta["end"]
                current_best_next_start = meta_words[i+1]["start"] if i+1 < len(meta_words) else None

        if current_text:
            new_segments.append({"text": current_text, "start": current_start, "end": segment["end"]})

    return new_segments

def format_timestamp(seconds: float, always_include_hours: bool = False, decimal_marker: str = '.'):
    """
    Format a (non-negative) number of seconds as "[HH:]MM:SS<decimal_marker>mmm".
    Hours are included only if they are not zero, or if `always_include_hours` is True.
    """
    assert seconds >= 0, "non-negative timestamp expected"
    milliseconds = round(seconds * 1000.0)

    hours, milliseconds = divmod(milliseconds, 3_600_000)
    minutes, milliseconds = divmod(milliseconds, 60_000)
    seconds, milliseconds = divmod(milliseconds, 1_000)

    hours_marker = f"{hours:02d}:" if always_include_hours or hours > 0 else ""
    return f"{hours_marker}{minutes:02d}:{seconds:02d}{decimal_marker}{milliseconds:03d}"

def write_vtt(result, file):
    """Write segments (dictionaries with keys "start", "end" and "text") in WebVTT format."""
    print("WEBVTT\n", file=file)
    for segment in result:
        print(
            f"{format_timestamp(segment['start'])} --> {format_timestamp(segment['end'])}\n"
            f"{segment['text'].strip().replace('-->', '->')}\n",
            file=file,
            flush=True,
        )

def write_srt(result, file):
    """Write segments (dictionaries with keys "start", "end" and "text") in SRT format."""
    for i, segment in enumerate(result, start=1):
        # write srt lines
        print(
            f"{i}\n"
            f"{format_timestamp(segment['start'], always_include_hours=True, decimal_marker=',')} --> "
            f"{format_timestamp(segment['end'], always_include_hours=True, decimal_marker=',')}\n"
            f"{segment['text'].strip().replace('-->', '->')}\n",
            file=file,
            flush=True,
        )

def cli():
    """
    Command line: convert transcription file(s) to srt and/or vtt.

    The input is a JSON file or a folder (where files ending with ".words.json" are processed).
    The output is a file with extension ".srt" or ".vtt" (only when the input is a file),
    or a folder where files are named after the input files.
    """

    import os
    import argparse

    supported_formats = ["srt", "vtt"]
    json_suffix = ".words.json"

    def output_basename(filename):
        # Remove the suffix ".words.json", or the extension if the file is named differently
        if filename.endswith(json_suffix):
            return filename[:-len(json_suffix)]
        return os.path.splitext(filename)[0]

    parser = argparse.ArgumentParser(
        description='Convert .word.json transcription files (output of whisper_timestamped) to srt or vtt, being able to cut long segments',
        formatter_class=argparse.ArgumentDefaultsHelpFormatter
    )
    parser.add_argument('input', type=str, help='Input json file, or input folder')
    parser.add_argument('output', type=str, help='Output srt or vtt file, or output folder')
    parser.add_argument('--max_length', default=200, help='Maximum length of a segment in characters', type=int)
    parser.add_argument('--format', type=str, default="all", help='Output format (if the output is a folder, i.e. not a file with an explicit extension)', choices= supported_formats + ["all"])
    args = parser.parse_args()

    input_is_folder = os.path.isdir(args.input)
    output_is_file = any(args.output.endswith("." + e) for e in supported_formats)

    if input_is_folder or not output_is_file:
        # The output is a folder
        if input_is_folder:
            filenames = [f for f in os.listdir(args.input) if f.endswith(json_suffix)]
            input_files = [os.path.join(args.input, f) for f in filenames]
        else:
            filenames = [os.path.basename(args.input)]
            input_files = [args.input]
        extensions = [args.format] if args.format != "all" else ["srt", "vtt"]
        output_files = [[os.path.join(args.output, output_basename(f) + "." + e) for e in extensions] for f in filenames]
        os.makedirs(args.output, exist_ok=True)
    else:
        input_files = [args.input]
        output_files = [[args.output]]
        # The folder is empty when the output is a bare file name (in the current folder)
        output_folder = os.path.dirname(args.output)
        if output_folder:
            os.makedirs(output_folder, exist_ok=True)

    for fn, outputs in zip(input_files, output_files):
        with open(fn, "r", encoding="utf-8") as f:
            transcript = json.load(f)
        segments = transcript["segments"]
        if args.max_length:
            # Words are separated by spaces, unless the language is known not to use them
            language = transcript.get("language")
            use_space = language not in ["zh", "ja", "th", "lo", "my"]
            segments = split_long_segments(segments, args.max_length, use_space=use_space)
        for output in outputs:
            if output.endswith(".srt"):
                with open(output, "w", encoding="utf-8") as f:
                    write_srt(segments, file=f)
            elif output.endswith(".vtt"):
                with open(output, "w", encoding="utf-8") as f:
                    write_vtt(segments, file=f)
            else:
                raise RuntimeError(f"Unknown output format for {output}")

if __name__ == "__main__":
    cli()
def transcribe_timestamped(
    # Main Whisper options
    model,
    audio,
    language=None,
    task="transcribe",

    # Additional options for word alignment
    remove_punctuation_from_words=False,
    compute_word_confidence=True,
    include_punctuation_in_confidence=False,
    refine_whisper_precision=0.5,
    min_word_duration=0.02, # Was 0.04 before 1.11
    plot_word_alignment=False,
    word_alignement_most_top_layers=None, # Was 6 before 1.9
    remove_empty_words=False,

    # Reproducibility
    seed=1234,

    vad=False,
    detect_disfluencies=False,
    trust_whisper_timestamps=TRUST_WHISPER_TIMESTAMP_BY_DEFAULT,
    naive_approach=False,

    # Other Whisper options
    temperature=0.0 if USE_EFFICIENT_BY_DEFAULT else (0.0, 0.2, 0.4, 0.6, 0.8, 1.0),
    best_of=None,
    beam_size=None,
    patience=None,
    length_penalty=None,
    compression_ratio_threshold=2.4,
    logprob_threshold=-1.0,
    no_speech_threshold=0.6,
    fp16=None,
    condition_on_previous_text=True,
    initial_prompt=None,
    suppress_tokens="-1",
    sample_len=None,
    verbose=False,
):
    """
    Transcribe an audio file using Whisper, and attach word-level timestamps to each segment.

    Parameters
    ----------
    model: Whisper or str
        The Whisper model instance. If a string is given, it is passed to `load_model` to get the model.

    audio: Union[str, np.ndarray, torch.Tensor]
        The path to the audio file to open, or the audio waveform in 16kHz.

    language: str
        The language to use for the transcription. If None, the language is detected automatically.

    task: str
        The task to perform: either "transcribe" or "translate".

    remove_punctuation_from_words: bool
        If False, words will be glued with the next punctuation mark (if any).
        If True, there will be no punctuation mark in the `words[:]["text"]` list.
        It only affects these strings; This has no influence on the computation of the word confidence, whatever the value of `include_punctuation_in_confidence` is.

    include_punctuation_in_confidence: bool
        Whether to include proba of punctuation in the computation of the (previous) word confidence.

    compute_word_confidence: bool
        Whether to compute word confidence.
        If True, a finer confidence for each segment will be computed as well.

    vad: bool or str in ["silero", "silero:3.1", "auditok"]
        Whether to perform voice activity detection (VAD) on the audio file, to remove silent parts before transcribing with Whisper model.
        This should decrease hallucinations from the Whisper model.
        When set to True, the default VAD algorithm is used (silero).
        When set to a string, the corresponding VAD algorithm is used (silero, silero:3.1 or auditok).
        Note that the library for the corresponding VAD algorithm must be installed.

    detect_disfluencies: bool
        Whether to detect disfluencies (i.e. hesitations, filler words, repetitions, corrections, etc.) that Whisper model might have omitted in the transcription.
        This should make the word timestamp prediction more accurate.
        And probable disfluencies will be marked as special words "[*]".

    trust_whisper_timestamps: bool
        Whether to rely on Whisper's timestamps to get approximative first estimate of segment positions (up to refine_whisper_precision).

    refine_whisper_precision: float
        How much can we refine Whisper segment positions, in seconds. Must be a multiple of 0.02.
        When it is 0, segment start/end are left as given by Whisper.

    min_word_duration: float
        Minimum duration of a word, in seconds. If a word is shorter than this, timestamps will be adjusted.
        It is only enforced when `trust_whisper_timestamps` is True.

    plot_word_alignment: bool
        Whether to plot the word alignment for each segment. matplotlib must be installed to use this option.

    word_alignement_most_top_layers: int
        Number of top decoder layers whose cross-attention is used for the alignment. Must be strictly positive.
        If None, the alignment heads returned by `get_alignment_heads(model)` are used instead
        (and if none are available, the 6 top layers are used).

    remove_empty_words: bool
        Whether to remove words with no duration occurring at the end of segments (probable Whisper hallucinations).

    seed: int
        Random seed to use for temperature sampling, for the sake of reproducibility.
        Choose None for unpredictable randomness.

    naive_approach: bool
        Force the naive approach that consists in decoding twice the audio file, once to get the transcription and once with the decoded tokens to get the alignment.
        Note that this approach is used anyway when beam_size is not None, when the temperature is a list with more than one element,
        and when the temperature is strictly positive with best_of greater than 1.

    temperature: float or list/tuple of float
        Temperature for sampling. A list/tuple with a single element is treated as that element.

    best_of, beam_size, patience, length_penalty, sample_len:
        Decoding options forwarded as is to Whisper.

    compression_ratio_threshold: float
        If the gzip compression ratio is above this value, treat as failed.

    logprob_threshold: float
        If the average log probability over sampled tokens is below this value, treat as failed.

    no_speech_threshold: float
        If the no_speech probability is higher than this value AND the average log probability
        over sampled tokens is below `logprob_threshold`, consider the segment as silent.

    fp16: bool
        Forwarded to Whisper. If None, it is enabled unless the model is on the "cpu" device.

    condition_on_previous_text: bool
        if True, the previous output of the model is provided as a prompt for the next window;
        disabling may make the text inconsistent across windows, but the model becomes less prone to
        getting stuck in a failure loop, such as repetition looping or timestamps going out of sync.

    initial_prompt: str
        Optional text to provide as a prompt for the first window.

    suppress_tokens: str
        Comma-separated list of token ids to suppress during sampling;
        '-1' will suppress most special characters except common punctuations.

    verbose: bool
        Whether to display the text being decoded to the console. If True, displays all the details,
        If False, displays minimal details. If None, does not display anything

    Returns
    -------
    The transcription dictionary returned by the underlying transcription function, where each element
    of "segments" that received words is augmented with a "words" list (word-level timestamps).
    """

    if seed is not None:
        torch.manual_seed(seed)
        torch.cuda.manual_seed_all(seed)

    # Check input options
    # Note: the ratio is compared to its rounded value with a tolerance, because an exact float comparison
    #       can reject legitimate multiples (a float division can land just off an integer, like 0.3 / 0.1)
    refine_whisper_precision_ratio = refine_whisper_precision / AUDIO_TIME_PER_TOKEN
    assert refine_whisper_precision >= 0 and abs(refine_whisper_precision_ratio - round(refine_whisper_precision_ratio)) < 1e-6, f"refine_whisper_precision must be a positive multiple of {AUDIO_TIME_PER_TOKEN}"
    refine_whisper_precision_nframes = round(refine_whisper_precision_ratio)
    assert min_word_duration >= 0, f"min_word_duration must be a positive number"
    assert word_alignement_most_top_layers is None or word_alignement_most_top_layers > 0, f"word_alignement_most_top_layers must be a strictly positive number"

    # Some decoding strategies are only supported by the naive approach
    if isinstance(temperature, (list, tuple)) and len(temperature) == 1:
        temperature = temperature[0]
    if isinstance(temperature, (list, tuple)):
        # temperature fallback
        naive_approach = True
    elif temperature > 0 and best_of is not None and best_of > 1:
        naive_approach = True
    if beam_size is not None:
        # beam-search
        naive_approach = True

    # Input options
    vad = check_vad_method(vad)
    if isinstance(model, str):
        model = load_model(model)
    if fp16 is None:
        fp16 = model.device != torch.device("cpu")

    # Safety check
    input_stride = N_FRAMES // model.dims.n_audio_ctx
    time_precision = input_stride * HOP_LENGTH / SAMPLE_RATE
    assert time_precision == AUDIO_TIME_PER_TOKEN

    # Use alignment heads unless a number of top layers was explicitly requested
    alignment_heads = get_alignment_heads(model) if word_alignement_most_top_layers is None else None
    if alignment_heads is None and word_alignement_most_top_layers is None:
        word_alignement_most_top_layers = 6

    alignment_options = dict(
        remove_punctuation_from_words=remove_punctuation_from_words,
        compute_word_confidence=compute_word_confidence,
        include_punctuation_in_confidence=include_punctuation_in_confidence,
        detect_disfluencies=detect_disfluencies,
        refine_whisper_precision_nframes=refine_whisper_precision_nframes,
        plot_word_alignment=plot_word_alignment,
        word_alignement_most_top_layers=word_alignement_most_top_layers,
        alignment_heads=alignment_heads,
    )
    whisper_options = dict(
        language=language,
        task=task,
        fp16=fp16,
        temperature=temperature,
        best_of=best_of,
        beam_size=beam_size,
        patience=patience,
        length_penalty=length_penalty,
        condition_on_previous_text=condition_on_previous_text,
        initial_prompt=initial_prompt,
        suppress_tokens=suppress_tokens,
        sample_len=sample_len,
        # With VAD, timestamps must be converted before being displayed: full verbose is done at the end
        verbose=verbose if (not vad or verbose is not True) else False,
    )
    other_options = dict(
        no_speech_threshold=no_speech_threshold,
        logprob_threshold=logprob_threshold,
        compression_ratio_threshold=compression_ratio_threshold,
    )

    if vad:
        audio = get_audio_tensor(audio)
        audio, convert_timestamps = remove_non_speech(audio, method=vad, plot=plot_word_alignment)

    global num_alignment_for_plot
    num_alignment_for_plot = 0

    if naive_approach:
        (transcription, words) = _transcribe_timestamped_naive(model, audio,
            min_word_duration=0.0, # Was 0.04 before 1.11
            trust_whisper_timestamps=trust_whisper_timestamps,
            **alignment_options, **whisper_options, **other_options)
    else:
        (transcription, words) = _transcribe_timestamped_efficient(model, audio,
            trust_whisper_timestamps=trust_whisper_timestamps,
            **alignment_options, **whisper_options, **other_options)
    if remove_empty_words:
        # Remove words with empty duration happening at the end of segments, to remove some hallucinations
        transcription, words = remove_last_null_duration_words(transcription, words, recompute_text=True)

    # Refine word positions
    ensure_increasing_positions(words, min_duration=min_word_duration if trust_whisper_timestamps else 0)

    # Combine words and segments
    whisper_segments = transcription["segments"]
    for word in words:
        if verbose and not naive_approach and not vad:
            print_timestamped(word)
        # Remove internal fields that are not part of the output
        word.pop("tokens")
        word.pop("tokens_indices")
        if "avg_logprob_reliable" in word:
            word.pop("avg_logprob_reliable")
        idx_segment = word.pop("idx_segment")
        assert idx_segment < len(whisper_segments), f"Fatal error: Got unexpected segment index {idx_segment} >= {len(whisper_segments)}"
        segment = whisper_segments[idx_segment]
        if "words" in segment:
            segment["words"].append(word)
        else:
            # First word of the segment: it gives the refined start of the segment
            segment["words"] = [word]
            if refine_whisper_precision:
                segment["start"] = word["start"]
        if refine_whisper_precision:
            # The last word seen so far gives the refined end of the segment
            segment["end"] = word["end"]

    if vad:
        # Recompute timestamps to match the original audio
        for segment in whisper_segments:
            for word in segment.get("words", []):
                word["start"], word["end"] = convert_timestamps(word["start"], word["end"])
                if verbose:
                    print_timestamped(word)
            if refine_whisper_precision and len(segment.get("words", [])):
                segment["start"] = segment["words"][0]["start"]
                segment["end"] = segment["words"][-1]["end"]
            else:
                segment["start"], segment["end"] = convert_timestamps(segment["start"], segment["end"])

    return transcription
See issue #18 + verbose_bugged = False + whisper_options["verbose"] = None if whisper_options["verbose"] is True else whisper_options["verbose"] # We will print intermediate results ourselves + + logit_filters = get_logit_filters(model, whisper_options) + language = whisper_options["language"] + tokenizer = get_tokenizer(model, task=whisper_options["task"], language=language) + + max_sample_len = sample_len or model.dims.n_text_ctx // 2 + n_ctx = model.dims.n_text_ctx + + debug = logger.getEffectiveLevel() >= logging.DEBUG + + word_alignement_most_top_layers = float("inf") if word_alignement_most_top_layers is None else word_alignement_most_top_layers + + # The main outcome + timestamped_word_segments = [] # list of timestamped word segments that have been collected so far + # Main variables to be accumulated + segment_tokens = [[]] # list of lists of token indices that have been collected so far (one list per segment) + segment_attweights = [[] for _ in range(min(word_alignement_most_top_layers, len(model.decoder.blocks)))] + # attention weights on the last segments + segment_avglogprobs = [] # average log probability for each segment (actually of the corresponding chunk, as computed by whisper) + segment_logprobs = [] # token log probabilities for each segment + # Variables related to options that can skip some segments + sot_index = None # index of the SOT token in the current set of processed tokens + no_speech_prob = None # no speech probability for the current 30 sec chunk + chunk_logprobs = [] # log probabilities for the current 30 sec chunk + chunk_tokens = [] # tokens for the current 30 sec chunk (list of Torch tensors) + chunk_tokens_nosot = [] # tokens for the current 30 sec chunk, without the SOT tokens (list of indices) + last_chunk_token = None # last token of the current chunk, that may be needed for corner cases + last_token_fallback = None # last token to use as a fallback if the model gets stuck + has_started = False # whether we have started 
decoding + mfcc = None # MFCC features for the current 30 sec chunk + new_mfcc = None # + num_inference_steps = 0 # number of inference steps performed so far (for debugging only) + language_probs = None # language detection probabilities + + def is_sot(curr_tokens): + return curr_tokens is None or len(curr_tokens) > 1 or curr_tokens[0] == tokenizer.sot + + def has_reached_decoding_limit(): + n = len(chunk_tokens_nosot) + 1 + m = n + (len(chunk_tokens[0]) if len(chunk_tokens) > 0 else 0) + return n + 1 >= max_sample_len or m > n_ctx + + def reset(add_segment, keep_last_token=True): + """ Reset the list of tokens for the current speech segment, and corresponding cross-attention weights """ + nonlocal segment_tokens, segment_attweights + if add_segment: + if keep_last_token: + segment_tokens.append([segment_tokens[-1][-1]]) + segment_attweights = [w[-1:] for w in segment_attweights] + else: + segment_tokens.append([]) + segment_attweights = [[] for w in segment_attweights] + segment_tokens[-2].pop(0) + elif len(segment_tokens[-1]) > 0: + if debug: + logger.debug(f"Reset last segment: {tokenizer.decode_with_timestamps(segment_tokens[-1])}") + segment_tokens[-1] = [] + segment_attweights = [[] for w in segment_attweights] + + saw_consecutive_timestamps = False + def must_flush_segment(curr_tokens): + """ Return whether or not the previously collected tokens must be used to add a new speech segment """ + nonlocal segment_tokens, saw_consecutive_timestamps, chunk_tokens_nosot + + if not is_sot(curr_tokens): + is_timestamp = curr_tokens[0] >= tokenizer.timestamp_begin + is_previous_timestamp = segment_tokens[-1][-1] >= tokenizer.timestamp_begin if len(segment_tokens[-1]) > 0 else False + consecutive_timestamps = is_timestamp and is_previous_timestamp + if consecutive_timestamps: + saw_consecutive_timestamps = True + return consecutive_timestamps + else: # Several tokens as a prompt or must flush last segments + + must_flush = len(segment_tokens[-1]) > 1 and not 
saw_consecutive_timestamps + if not must_flush and WHIPSER_GE_20230306: # If the last token is a timestamp, the last segment is used + if last_chunk_token is None: + must_flush = (len(segment_tokens[-1]) > 2 and segment_tokens[-1][-1] >= tokenizer.timestamp_begin) + else: + must_flush = (last_chunk_token >= tokenizer.timestamp_begin) + if not must_flush and trust_whisper_timestamps: + # Discard the end of the last transcription + reset(False) + saw_consecutive_timestamps = False + return must_flush + + index_begin_30sec_chunck = 0 + def get_index_begin_30sec_chunck(curr_tokens): + nonlocal index_begin_30sec_chunck, has_started + + if is_sot(curr_tokens) and has_started: + if trust_whisper_timestamps: + res = index_begin_30sec_chunck + index_begin_30sec_chunck = len(segment_tokens)-1 + else: + res = len(segment_tokens)-1 + return res + + def align_last_segment(curr_tokens=None): + nonlocal segment_tokens, segment_attweights, timestamped_word_segments, has_started, no_speech_prob, chunk_tokens, chunk_tokens_nosot, chunk_logprobs, mfcc, new_mfcc, logit_filters, index_begin_30sec_chunck, last_token_fallback, num_inference_steps + + if debug and trust_whisper_timestamps: + logger.debug(f"Add segment {len(timestamped_word_segments)+1} at step {num_inference_steps}:\n\t{tokenizer.decode_with_timestamps(segment_tokens[-1])}") + + tokens = segment_tokens[-1][1:] + + # When the decoding hit the max limit (number of tokens) -- usually when the language model gets stuck -- + # then we have to recover the last token from what is send to the decoder + unfinished_decoding = has_reached_decoding_limit() + last_is_not_timestamp = len(tokens) and tokens[-1] < tokenizer.timestamp_begin + last_token_reliable = True + + if unfinished_decoding: + logger.debug(f"WARNING: decoding hit the max limit for segment {segment_tokens[-1]} (It usually happens when the language model gets stuck)") + # The last token chosen is in the prompt for the new chunk + if curr_tokens is not None and 
curr_tokens[0] == tokenizer.sot_prev: + index_sot = (curr_tokens == tokenizer.sot).nonzero(as_tuple=True) + assert len(index_sot) == 1 + index_sot = index_sot[0].item() + assert index_sot > 0 + last_token_fallback = curr_tokens[index_sot-1].item() + logger.debug(f" Guessed last token from the prompt for the new chunk: {last_token_fallback}") + # Fallback for the last segment, or without prompt: Assume greedy decoding + else: + last_token_fallback = torch.argmax(chunk_logprobs[-1]).item() if last_chunk_token is None else last_chunk_token + last_token_reliable = (temperature == 0) + logger.debug(f" Guess last token using probas (assuming greedy decoding): {last_token_fallback}") + if debug: + logger.debug(f"WARNING: also add last token: {tokenizer.decode_with_timestamps([last_token_fallback])}") + + tokens.append(last_token_fallback) + segment_tokens[-1].append(last_token_fallback) + attention_weights = [torch.cat(w, dim=-2) for w in segment_attweights] + last_logprobs = chunk_logprobs[-1] + elif last_is_not_timestamp: # was emitted early, without a timestamp before + logger.debug(f"WARNING: end timestamp not produced. 
Adding <|endoftext|>") + tokens.append(tokenizer.eot) + segment_tokens[-1].append(tokenizer.eot) + attention_weights = [torch.cat(w, dim=-2) for w in segment_attweights] + last_logprobs = chunk_logprobs[-1] + else: + attention_weights = [torch.cat(w[:-1], dim=-2) for w in segment_attweights] + last_logprobs = chunk_logprobs[-2] + + # Check prediction of last token + end_token = tokens[-1] + if end_token >= tokenizer.timestamp_begin: + start_token = tokens[0] + assert start_token >= tokenizer.timestamp_begin + # If Whisper prediction of the end is obviously wrong, we predict it again (constrained) + if end_token <= start_token: + new_end_token = last_logprobs[start_token+1:].argmax() + start_token + 1 + tokens[-1] = new_end_token.item() + if debug: + logger.debug(f"Re-estimated end token {tokenizer.decode_with_timestamps([new_end_token])} (was {tokenizer.decode_with_timestamps([end_token])}) to be after start token {tokenizer.decode_with_timestamps([start_token])}") + + if len(tokens) <= 1: + # Corner case: nothing in between timestamps + ws = [] + else: + ws = perform_word_alignment( + tokens, + attention_weights, + tokenizer, + use_space=should_use_space(language), + alignment_heads=alignment_heads, + remove_punctuation_from_words=remove_punctuation_from_words, + refine_whisper_precision_nframes=refine_whisper_precision_nframes, + detect_disfluencies=detect_disfluencies, + unfinished_decoding=unfinished_decoding, + mfcc=mfcc, + plot=plot_word_alignment, + debug=debug, + ) + + add_segment = len(ws) > 0 + if add_segment: + timestamped_word_segments.append(ws) + else: + logger.debug(f"Not added!") + reset(add_segment, not is_sot(curr_tokens)) + + return add_segment, unfinished_decoding, last_token_reliable + + def may_flush_segment(curr_tokens = None): + """ Add a speech segment with the new tokens if necessary. 
+ May also remove the last collected segments if filtered out by Whisper (no_speech_prob <= no_speech_threshold) + """ + nonlocal segment_tokens, segment_attweights, timestamped_word_segments, segment_logprobs, has_started, no_speech_prob, chunk_tokens, chunk_tokens_nosot, chunk_logprobs, mfcc, new_mfcc, logit_filters, index_begin_30sec_chunck, last_token_fallback, num_inference_steps, last_chunk_token + + # Check if a new segment should be added + unfinished_decoding = False + last_token_reliable = True + + if must_flush_segment(curr_tokens) and trust_whisper_timestamps: + _, unfinished_decoding, last_token_reliable = align_last_segment(curr_tokens) + + i_start = get_index_begin_30sec_chunck(curr_tokens) + + # All segments from previous 30sec chunck have been collected + if i_start is not None: + + if not trust_whisper_timestamps: + + tokens = torch.Tensor(segment_tokens[-1]).int() + idx_task = torch.where(tokens==tokenizer.sot_sequence[-1])[0][0].item() # index of <|transcribe|> + + is_special = tokens.ge(tokenizer.eot) + # Remove prompt + is_special[:idx_task] = True + # Keep begin timestamp + is_special[idx_task:idx_task+2] = False + + is_timestamp = tokens.ge(tokenizer.timestamp_begin) + consecutive = torch.where(is_timestamp[1:] & is_timestamp[:-1])[0] + if (WHIPSER_GE_20230306 or has_reached_decoding_limit()) and ( + (is_timestamp[-1] and not is_timestamp[-2]) if last_chunk_token is None else + last_chunk_token >= tokenizer.timestamp_begin and not is_timestamp[-2] + ): + consecutive = torch.cat([consecutive, torch.Tensor([len(tokens)-1]).int()]) + last_is_timestamp = True + if len(consecutive): + # Remove last tokens + is_special[consecutive[-1]+1:] = True + # Keep end timestamp + is_special[consecutive[-1]] = False + elif is_timestamp[-1]: + # Keep end timestamp + is_special[-1] = False + else: + last_is_timestamp = False + + if use_timestamps_for_alignment and len(consecutive): + # Keep all timestamps + is_special[idx_task+2:consecutive[-1]] = False + + # 
Do remove what has to be removed + is_next_achar = ~torch.cat([is_special[1:], torch.Tensor([False]).bool()]) + for i, weights in enumerate(segment_attweights): + assert len(weights) == len(tokens), f"{len(weights)} attention weights != {len(tokens)}" + # We must remove attention weights used to predict timestamp tokens + segment_attweights[i] = [w for s, w in zip(is_next_achar, weights) if s] + tokens_filtered = tokens[~is_special] + assert len(segment_attweights[0]) == len(tokens_filtered), f"{len(segment_attweights[0])} attention weights != {len(tokens_filtered)} " + + # Replace first and last timestamp + orig_start, orig_end = tokens_filtered[1].item(), tokens_filtered[-1].item() + tokens_filtered[1] = tokenizer.timestamp_begin # <|0.00|> + if last_is_timestamp: + tokens_filtered[-1] = tokenizer.timestamp_begin + N_FRAMES // 2 # <|30.00|> + segment_tokens[-1] = tokens_filtered.tolist() + + # Do alignement + added, unfinished_decoding, last_token_reliable = align_last_segment() + + # Re-split into segments (if necessary) + if added: + if len(consecutive) > 1: + segments_timestamped_concat = timestamped_word_segments[-1] + new_segments_timestamped = [] + new_segment_tokens = [] + start = idx_task+1 + i_word = 0 + for i, end in enumerate(consecutive): + end = end.item() + new_segment_tokens.append(tokens[start:end+1].tolist()) + if debug: + logger.debug(f"Add segment {len(timestamped_word_segments)+i}:\n\t{tokenizer.decode_with_timestamps(new_segment_tokens[-1])}") + total_length = end - start - 1 + start = end+1 + length = 0 + new_segments_timestamped.append([]) + while length < total_length: + if not use_timestamps_for_alignment and i_word == len(segments_timestamped_concat): + # This can happen in the case of "..." + assert total_length == 1 and i == len(consecutive)-1, "Unexpected situation!" 
+ break + assert i_word < len(segments_timestamped_concat), f"i_word={i_word} < len(segments_timestamped_concat)={len(segments_timestamped_concat)}" + word = segments_timestamped_concat[i_word] + new_segments_timestamped[-1].append(word) + length += len(word["tokens_indices"]) + i_word += 1 + # This can be non zero, when a punctuation (alone in a segment) is glued to the previous segment + if use_timestamps_for_alignment: + assert length == total_length, f"length={length} != total_length={total_length}" + elif length > total_length: + delta = length - total_length + word = new_segments_timestamped[-1][-1] + word_tokindices = word["tokens_indices"] + word_tokens = word["tokens"] + word["tokens_indices"] = word_tokindices[:-delta] + word["tokens"] = word_tokens[:-delta] + word["word"] = "".join(word_tokens[:-delta]) + i_word -= 1 + t = segments_timestamped_concat[i_word]["end"] + segments_timestamped_concat[i_word] = dict( + text="".join(word_tokens[-delta:]), + start=t, end=t, # Word without timestamp + tokens=word_tokens[-delta:], + tokens_indices=word_tokindices[-delta:], + ) + + assert i_word == len(segments_timestamped_concat) + + segment_tokens = segment_tokens[:-2] + new_segment_tokens + [segment_tokens[-1]] + timestamped_word_segments = timestamped_word_segments[:-1] + new_segments_timestamped + + else: + + # Recover start and end token + segment = segment_tokens[-2] + tokenizer.decode_with_timestamps([orig_start,orig_end]) + segment[0] = orig_start + if last_is_timestamp: + segment[-1] = orig_end + + if debug: + logger.debug(f"Add segment {len(timestamped_word_segments)}:\n\t{tokenizer.decode_with_timestamps(segment)}") + + if unfinished_decoding: + timestamped_word_segments[-1][-1]["avg_logprob_reliable"] = last_token_reliable + + reset(False) + + mfcc = new_mfcc + + n_segments = len(segment_tokens)-1 + + # Get word confidence and/or check if previous segments shoud have been skipped + should_skip = False + if compute_word_confidence or no_speech_threshold 
is not None: + + # no voice activity check + should_skip = (no_speech_prob > no_speech_threshold) if (no_speech_threshold is not None) else False + if compute_word_confidence or (should_skip and logprob_threshold is not None): + n = len(chunk_logprobs) + if n == len(chunk_tokens_nosot): + chunk_tokens_nosot = chunk_tokens_nosot[1:] + if unfinished_decoding: + assert last_token_fallback is not None + last_tokens = [last_token_fallback] + timestamped_word_segments[-1][-1]["avg_logprob_reliable"] = last_token_reliable + n += 1 + elif has_reached_decoding_limit(): + # there were segments in the 30sec chunck, and then the LM got stuck + last_tokens = [torch.argmax(chunk_logprobs[-1]).item()] + timestamped_word_segments[-1][-1]["avg_logprob_reliable"] = (temperature == 0) + else: + last_tokens = [tokenizer.eot] + chunck_indices = chunk_tokens_nosot + last_tokens + assert len(chunk_logprobs) == len(chunck_indices), f"{len(chunk_logprobs)} != {len(chunck_indices)}" + logprobs = torch.cat([logprob[i].unsqueeze(0) for (logprob, i) in zip(chunk_logprobs, chunck_indices)]) + assert min([p.isfinite().item() for p in logprobs]), \ + f"Got infinite logprob among ({len(logprobs)}) {[(i, tokenizer.decode_with_timestamps([i]), v.item()) for (i,v) in zip(chunck_indices, logprobs)]}" + sum_logprob = sum(logprobs) + avg_logprob = sum_logprob/n + # don't skip if the logprob is high enough, whatever the no_speech_prob is + if logprob_threshold is not None and avg_logprob > logprob_threshold: + should_skip = False + + if should_skip: + logger.debug(f"Skipping last {n_segments-i_start} segments (no_speech_prob {no_speech_prob} > {no_speech_threshold} and avg_logprob {avg_logprob} < {logprob_threshold})") + index_begin_30sec_chunck -= n_segments-i_start + segment_tokens = segment_tokens[:i_start] + [segment_tokens[-1]] + timestamped_word_segments = timestamped_word_segments[:i_start] + elif compute_word_confidence: + avg_logprob = avg_logprob.item() + i_token_end = -1 + for i in 
range(i_start, n_segments): + tokens = segment_tokens[i] + i_token_start = i_token_end + 1 + i_token_end = i_token_start + len(tokens) + assert chunck_indices[i_token_start:i_token_end] == tokens, f"Inconsistent token list {tokenizer.decode_with_timestamps(chunck_indices[i_token_start:i_token_end])} != {tokenizer.decode_with_timestamps(tokens)}" + i_token_start += 1 # skip sos (start time) + if not unfinished_decoding or i != n_segments-1: + i_token_end -= 1 # skip eos (end time) + segment_logprobs.append(logprobs[i_token_start:i_token_end]) + segment_avglogprobs.append(avg_logprob) + else: + for i in range(i_start, n_segments): + segment_logprobs.append(None) + segment_avglogprobs.append(None) + + else: + for i in range(i_start, n_segments): + segment_logprobs.append(None) + segment_avglogprobs.append(None) + + if verbose_bugged and not should_skip: + for segment in timestamped_word_segments[i_start:]: + for word in segment: + print_timestamped(word) + + # Reset counters + chunk_tokens = [] + chunk_tokens_nosot = [] + chunk_logprobs = [] + no_speech_prob = None + + def hook_attention_weights(layer, ins, outs, index): + nonlocal segment_attweights + # In old version of whisper, output is a single tensor + assert isinstance(outs, tuple) and len(outs) == 2, "whisper seems to be outdated, please update it (pip install --upgrade --no-deps --force-reinstall git+https://github.com/openai/whisper.git)" + if not has_started: + return + w = outs[-1] + # Only the last attention weights is useful + if w.shape[-2] > 1: + w = w[:, :, -1:, :] + segment_attweights[index].append(w.cpu()) + + def hook_mfcc(layer, ins, outs): + nonlocal new_mfcc, mfcc + new_mfcc = ins[0] + if mfcc is None: + mfcc = new_mfcc + + def hook_input_tokens(layer, ins, outs): + nonlocal segment_tokens, sot_index, chunk_tokens, chunk_tokens_nosot, logit_filters, has_started, language, num_inference_steps + num_inference_steps += 1 + + curr_tokens = ins[0] + assert curr_tokens.shape[0] == 1, "Batch decoding 
is not supported" + curr_tokens = curr_tokens.squeeze(0) + + if is_sot(curr_tokens): + chunk_prompt = curr_tokens.tolist() + if language is None: + if len(curr_tokens) > 1: + language = tokenizer.decode(curr_tokens[-2:-1]) + language = language[2:-2] # remove trailing "<|" and "|>" + whisper_options["language"] = language + + if verbose and not whisper_options["verbose"] and len(curr_tokens) > 1: + # Reproduce whisper verbose (2/2) + print(f"Detected language: {whisper.tokenizer.LANGUAGES[language].title()}") + sys.stdout.flush() + + logit_filters = get_logit_filters(model, whisper_options, prompt = chunk_prompt[1:-len(tokenizer.sot_sequence)]) + + may_flush_segment(curr_tokens) + + # Get the index of the <|startoftranscript|> tokens (to get proba of silence later) + if is_sot(curr_tokens): + has_started = len(curr_tokens) > 1 or not model.is_multilingual + if no_speech_threshold is not None: + sot_index = curr_tokens.tolist().index(tokenizer.sot) + else: + sot_index = None + + # Keep the last token only + if has_started: + segment_tokens[-1].append(curr_tokens[-1].item()) + + # Accumulate tokens + if has_started: + chunk_tokens.append(curr_tokens) + if not is_sot(curr_tokens): + chunk_tokens_nosot.append(curr_tokens[-1].item()) + else: + if verbose and not whisper_options["verbose"]: + # Reproduce whisper verbose (1/2) + print("Detecting language using up to the first 30 seconds. 
Use `--language` to specify the language") + + embedding_weights = None + def hook_output_logits(layer, ins, outs): + nonlocal no_speech_prob, chunk_logprobs, segment_tokens, chunk_tokens, chunk_tokens_nosot, last_chunk_token, embedding_weights, has_started, language, language_probs + + if embedding_weights is None: + embedding_weights = torch.transpose(model.decoder.token_embedding.weight, 0, 1).to(outs[0].dtype) + + # Get the probability of silence + if sot_index is not None and no_speech_prob is None: + logits = (outs[0][sot_index,:] @ embedding_weights).float() + logits = logits.softmax(dim=-1) + no_speech_prob = logits[tokenizer.no_speech].item() + + # Get language probabilities + if language is None and sot_index is not None and model.is_multilingual: + index_start = tokenizer.sot + 1 + index_end = index_start + len(tokenizer.all_language_tokens) + logits = (outs[0][sot_index,:] @ embedding_weights).float() + language_probs = logits[index_start:index_end].softmax(dim=-1) + language_probs = dict(zip(whisper.tokenizer.LANGUAGES, language_probs.tolist())) + + # Get the log-probabilities of tokens (we don't know yet which one will be chosen) + if has_started: + logits = (outs[0][-1:,:] @ embedding_weights).float() + tokens = torch.cat(chunk_tokens).unsqueeze(0) + for logit_filter in logit_filters: + logit_filter.apply(logits, tokens) + logits = F.log_softmax(logits.squeeze(0), dim=-1) + chunk_logprobs.append(logits) + + if WHIPSER_GE_20230306 and has_reached_decoding_limit(): + last_chunk_token = torch.argmax(logits).item() + else: + last_chunk_token = None + + try: + + # Add hooks to the model, to get tokens and attention weights on the fly + all_hooks = [] + all_hooks.append(model.encoder.conv1.register_forward_hook(hook_mfcc)) + all_hooks.append(model.decoder.token_embedding.register_forward_hook(hook_input_tokens)) + nblocks = len(model.decoder.blocks) + j = 0 + for i, block in enumerate(model.decoder.blocks): + if i < nblocks - 
word_alignement_most_top_layers: + continue + all_hooks.append( + block.cross_attn.register_forward_hook( + lambda layer, ins, outs, index=j: hook_attention_weights(layer, ins, outs, index)) + ) + j += 1 + if compute_word_confidence or no_speech_threshold is not None: + all_hooks.append(model.decoder.ln.register_forward_hook(hook_output_logits)) + + transcription = model.transcribe(audio, **whisper_options) + + finally: + + # Remove hooks + for hook in all_hooks: + hook.remove() + + # Finalize (collect last segment) + may_flush_segment() + segment_tokens.pop(-1) + + token_special_idx = min(tokenizer.sot, tokenizer.eot) + def filter_tokens(tokens): + while len(tokens) and tokens[0] >= token_special_idx: + tokens = tokens[1:] + while len(tokens) and tokens[-1] >= token_special_idx: + tokens = tokens[:-1] + return tokens + + assert len(segment_tokens) == len(timestamped_word_segments), f"Inconsistent number of segments: tokens ({len(segment_tokens)}) != timestamped_word_segments ({len(timestamped_word_segments)})" + assert len(segment_avglogprobs) == len(segment_tokens), f"Inconsistent number of segments: avg logprobs ({len(segment_avglogprobs)}) != tokens ({len(segment_tokens)})" + assert len(segment_logprobs) == len(segment_tokens), f"Inconsistent number of segments: logprobs ({len(segment_logprobs)}) != tokens ({len(segment_tokens)})" + + whisper_segments = transcription["segments"] + l1 = len(whisper_segments) + l2 = len(timestamped_word_segments) + if l1 != l2 and l1 != 0: + logger.warning(f"Inconsistent number of segments: whisper_segments ({l1}) != timestamped_word_segments ({l2})") + assert l1 == l2 or l1 == 0, f"Inconsistent number of segments: whisper_segments ({l1}) != timestamped_word_segments ({l2})" + + logger.debug("Compile results") + words = [] + for i, (segment, timestamped_words, token, avglogprob, logprobs) in enumerate(zip(whisper_segments, timestamped_word_segments, segment_tokens, segment_avglogprobs, segment_logprobs)): + timestamped_tokens = 
filter_tokens(token) + whisper_tokens = filter_tokens(segment["tokens"]) + if timestamped_tokens != whisper_tokens: + if len(timestamped_tokens) == len(whisper_tokens) + 1: + logger.warning(f"An additional token was added on segment {i}") + elif WHIPSER_GE_20230306 and len(whisper_tokens) == 0: + logger.warning(f"Whisper has empty segment {i}") + assert segment["end"] == segment["start"], f"Fatal Error: Got empty segment {i} with non-zero duration" + segment["tokens"] = timestamped_tokens + segment["text"] = tokenizer.decode(timestamped_tokens) + else: + assert len(timestamped_tokens) < len(whisper_tokens) and timestamped_tokens == whisper_tokens[:len(timestamped_tokens)], \ + f"Fatal Error: Got inconsistent text for segment {i}:\n({len(timestamped_tokens)})\n{tokenizer.decode_with_timestamps(timestamped_tokens)}\n{timestamped_tokens}\n!=\n({len(whisper_tokens)})\n{tokenizer.decode_with_timestamps(whisper_tokens)}\n{whisper_tokens[:len(timestamped_tokens)]}" + segment["tokens"] = token if WHIPSER_GE_20230306 else timestamped_tokens # tokens include special timestamp tokens since 20230306 + segment["text"] = tokenizer.decode(segment["tokens"]) + logger.warning(f"Text had to be shortned on segment {i}:\n{tokenizer.decode(timestamped_tokens)}\n!=\n{tokenizer.decode(whisper_tokens)}") + timestamped_words[-1]["avg_logprob_reliable"] = False + + offset = segment["seek"] * HOP_LENGTH / SAMPLE_RATE + for timestamped_word in timestamped_words: + timestamped_word["start"] += offset + timestamped_word["end"] += offset + timestamped_word["idx_segment"] = i + + if compute_word_confidence: + if "avg_logprob_reliable" not in timestamped_words[-1] or timestamped_words[-1]["avg_logprob_reliable"]: + # assert abs(segment["avg_logprob"] - avglogprob) < 1e-2, f"Fatal Error: Got inconsistent logprob for segment {i}: {segment['avg_logprob']} != {avglogprob}" + if abs(segment["avg_logprob"] - avglogprob) >= 1e-2: + logger.warning(f"Recomputed different logprob for segment {i}: 
{avglogprob} != {segment['avg_logprob']}") + if include_punctuation_in_confidence: + segment["confidence"] = round_confidence(logprobs.mean().exp().item()) + else: + logprobs_nopunc = [] + i_end = 0 + for timestamped_word in timestamped_words: + i_start = i_end + tokens = timestamped_word["tokens"] + i_end += len(tokens) + + assert i_end <= len(logprobs), f"Fatal Error: Got out-of-bound index for segment {i}: {i_end} > {len(logprobs)}" + if include_punctuation_in_confidence: + word_logprobs = logprobs[i_start:i_end] + else: + while len(tokens) > 1 and len(tokens[-1]) and tokens[-1][-1] in _punctuation: # Note: look at the last character of token, to take into account "...", "!!", etc. + tokens = tokens[:-1] + word_logprobs = logprobs[i_start:i_start + len(tokens)] + logprobs_nopunc.append(word_logprobs) + + timestamped_word["confidence"] = round_confidence(word_logprobs.mean().exp().item() if len(word_logprobs) else 0.0) + + if i_end not in [len(logprobs), len(logprobs)-1]: + logger.warning(f"Got inconsistent length for segment {i} ({len(logprobs)} != {i_end}). 
Some words have been ignored.") + if not include_punctuation_in_confidence: + logprobs_nopunc = torch.cat(logprobs_nopunc) + segment["confidence"] = round_confidence(logprobs_nopunc.mean().exp().item()) + + words.extend(timestamped_words) + + if language_probs: + transcription["language_probs"] = language_probs + + return transcription, words + +def _transcribe_timestamped_naive( + model, + audio, + remove_punctuation_from_words, + compute_word_confidence, + include_punctuation_in_confidence, + refine_whisper_precision_nframes, + alignment_heads, + plot_word_alignment, + word_alignement_most_top_layers, + detect_disfluencies, + trust_whisper_timestamps, + min_word_duration, + **whisper_options, +): + verbose = whisper_options["verbose"] + whisper_options["verbose"] = None if whisper_options["verbose"] is True else whisper_options["verbose"] # We will print intermediate results ourselves + language = whisper_options["language"] + refine_whisper_precision_sec = refine_whisper_precision_nframes * AUDIO_TIME_PER_TOKEN + + word_alignement_most_top_layers = float("inf") if word_alignement_most_top_layers is None else word_alignement_most_top_layers + + audio = get_audio_tensor(audio) + audio_duration = audio.shape[-1] / SAMPLE_RATE + + if verbose and language is None and not whisper_options["verbose"]: + # Reproduce whisper verbose (1/2) + print("Detecting language using up to the first 30 seconds. 
Use `--language` to specify the language") + + tokenizer = get_tokenizer(model, task=whisper_options["task"], language=language) + + language_probs = None + def hook_output_logits(layer, ins, outs): + nonlocal language_probs, tokenizer + + # Get language probabilities + if language_probs is None: + if outs.shape[1] == 1: + embedding_weights = torch.transpose(model.decoder.token_embedding.weight, 0, 1).to(outs[0].dtype) + index_start = tokenizer.sot + 1 + index_end = index_start + len(tokenizer.all_language_tokens) + logits = (outs[0][0,:] @ embedding_weights).float() + language_probs = logits[index_start:index_end].softmax(dim=-1) + language_probs = dict(zip(whisper.tokenizer.LANGUAGES, language_probs.tolist())) + else: + language_probs = False + + all_hooks = [] + if model.is_multilingual: + all_hooks.append(model.decoder.ln.register_forward_hook(hook_output_logits)) + + try: + transcription = model.transcribe(audio, **whisper_options) + finally: + for hook in all_hooks: + hook.remove() + + if verbose and language is None and not whisper_options["verbose"]: + # Reproduce whisper verbose (2/2) + print(f"Detected language: {whisper.tokenizer.LANGUAGES[transcription['language']].title()}") + sys.stdout.flush() + + language = norm_language(transcription["language"]) + use_space = should_use_space(language) + + n_mels = model.dims.n_mels if hasattr(model.dims, "n_mels") else 80 + + attention_weights = [[] for _ in range(min(word_alignement_most_top_layers,len(model.decoder.blocks)))] + + try: + + all_hooks = [] + + # Hook the model + nblocks = len(model.decoder.blocks) + j = 0 + for i, block in enumerate(model.decoder.blocks): + if i < nblocks - word_alignement_most_top_layers: + continue + all_hooks.append( + block.cross_attn.register_forward_hook( + lambda layer, ins, outs, index=j: attention_weights.__setitem__(index, outs[-1]) + ) + ) + j += 1 + + + # When not relying on Whisper timestamps + current_tokens = [] + token_to_idx_segment = [] + + words = [] + 
previous_end = 0 + whisper_segments = transcription["segments"] + for i_segment, segment in enumerate(whisper_segments): + + # Note: this could also be a fix to issue #61 where a "<|te|>" token was predicted + # segment["tokens"] = [t for t in segment["tokens"] if t < tokenizer.eot or t >= tokenizer.timestamp_begin] + + start = end = tokens = None + if trust_whisper_timestamps: + + start = segment["start"] + end = segment["end"] + if end < start: + # Whisper is wrong on the prediction of segment end + end = min(audio_duration, start + SEGMENT_DURATION) + + start_margin_min = start - refine_whisper_precision_sec + start_margin_max = start + refine_whisper_precision_sec + if start >= audio_duration - min_word_duration or (previous_end >= start_margin_min and previous_end <= start_margin_max): + # Make start as accurate as possible (as the decoding will start with timestamp <|0|>) + start = previous_end + else: + # Fallback + start = start_margin_min + + if start > audio_duration - min_word_duration: + # Skip last segment if too short + logger.warning(f"Skipping segment outside of audio duration {audio_duration} (original: {segment['start']}-{segment['end']}, new: {start}-XXX)") + continue + + end_margin_min = end - refine_whisper_precision_sec + end_margin_max = end + refine_whisper_precision_sec + if i_segment < len(whisper_segments) - 1: + # Try to enforce: + # end + min_word_duration <= next start + refine_whisper_precision_sec + end_margin_max2 = whisper_segments[i_segment + 1]["start"] + refine_whisper_precision_sec - min_word_duration + if end_margin_max2 >= end_margin_min: + end_margin_max = min(end_margin_max2, end_margin_max) + end = min(audio_duration, end_margin_max) + + if end < start + min_word_duration: + logger.warning(f"Got super short segment (original from whisper: {segment['start']}-{segment['end']}, new: {start, end})") + end = min(audio_duration, start + min_word_duration) + if end <= start: + logger.warning(f"Skipping this short segment occuring 
too close to the end of the audio") + continue + + tokens = segment["tokens"] + + else: + + seek = segment["seek"] + new_tokens = segment["tokens"] + if not len(new_tokens): + continue + # Add timestamps that will be needed after + if new_tokens[0] < tokenizer.timestamp_begin: + relative_start = segment["start"] - (seek * HOP_LENGTH / SAMPLE_RATE) + start_token = round(relative_start * SAMPLE_RATE / AUDIO_SAMPLES_PER_TOKEN) + tokenizer.timestamp_begin + new_tokens = [start_token] + new_tokens + if new_tokens[-1] < tokenizer.timestamp_begin: + relative_end = segment["end"] - (seek * HOP_LENGTH / SAMPLE_RATE) + end_token = round(relative_end * SAMPLE_RATE / AUDIO_SAMPLES_PER_TOKEN) + tokenizer.timestamp_begin + new_tokens = new_tokens + [end_token] + + current_tokens.extend(new_tokens) + token_to_idx_segment.extend([i_segment] * len(new_tokens)) + + next_seek = whisper_segments[i_segment+1]["seek"] if i_segment < len(whisper_segments) - 1 else None + if seek != next_seek: + start = float(seek * HOP_LENGTH / SAMPLE_RATE) + assert start < audio_duration, f"Got start {start} which is outside of audio duration {audio_duration}" + end = min(start + SEGMENT_DURATION, audio_duration) + tokens = current_tokens + + if tokens is None or not len(tokens): + continue + + start_sample = min(round(start * SAMPLE_RATE), audio.shape[-1]) + end_sample = min(round(end * SAMPLE_RATE), audio.shape[-1]) + + # Extract features on the audio segment + sub_audio = audio_minimum_padding(audio[start_sample:end_sample]) + + mfcc = whisper.log_mel_spectrogram(sub_audio, n_mels).to(model.device) + mfcc = whisper.pad_or_trim(mfcc, N_FRAMES) + mfcc = mfcc.unsqueeze(0) + + segment_tokens_check = [] + if tokens[0] >= tokenizer.timestamp_begin: + segment_tokens_check.append(tokens[0]) + while tokens[0] >= tokenizer.timestamp_begin: + tokens = tokens[1:] + assert len(tokens), "Got transcription with only timestamps!" 
+ last_token_check = None + while tokens[-1] >= tokenizer.timestamp_begin: + last_token_check = tokens[-1] + tokens = tokens[:-1] + + tokens = [ + *tokenizer.sot_sequence, + tokenizer.timestamp_begin, + ] + tokens + + i_start = len(tokenizer.sot_sequence) + + with torch.no_grad(): + logprobs = model(mfcc, torch.Tensor(tokens).int().to(model.device).unsqueeze(0)) + logprobs = F.log_softmax(logprobs, dim=-1) + + end_token = tokenizer.timestamp_begin + round(min(N_FRAMES * HOP_LENGTH, end_sample - start_sample) // AUDIO_SAMPLES_PER_TOKEN) + tokens = tokens[i_start:] + [end_token] + attention_weights = [w[:, :, i_start-1:, :] for w in attention_weights] + + ws = perform_word_alignment( + tokens, + attention_weights, + tokenizer, + use_space=use_space, + alignment_heads=alignment_heads, + remove_punctuation_from_words=remove_punctuation_from_words, + refine_whisper_precision_nframes=refine_whisper_precision_nframes, + detect_disfluencies=detect_disfluencies, + mfcc=mfcc, + plot=plot_word_alignment, + ) + + segment_logprobs = [] + i_token = 1 + + for word in ws: + + word["start"] = round(word["start"] + start, 2) + word["end"] = round(word["end"] + start, 2) + + if trust_whisper_timestamps: + word.update({"idx_segment": i_segment}) + else: + assert i_token < len(tokens) + assert not len(word["tokens_indices"]) or word["tokens_indices"][0] == tokens[i_token] + word.update({"idx_segment": token_to_idx_segment[i_token]}) + i_token += len(word["tokens"]) + while i_token < len(tokens) and tokens[i_token] >= tokenizer.timestamp_begin: + i_token += 1 + + tok_indices = word["tokens_indices"] + segment_tokens_check.extend(tok_indices) + + if compute_word_confidence: + tok = word["tokens"] + i_end = i_start + len(tok) + if include_punctuation_in_confidence: + while len(tok) > 1 and len(tok[-1]) and tok[-1][-1] in _punctuation: # Note: look at the last character of token, to take into account "...", "!!", etc. 
+ tok = tok[:-1] + tok_indices = tok_indices[:-1] + word_logprobs = [logprobs[:, step, tok] for (step, tok) in zip(range(i_start, i_start + len(tok_indices)), tok_indices)] + i_start = i_end + if len(word_logprobs): + word_logprobs = torch.cat(word_logprobs) + segment_logprobs.append(word_logprobs) + word_confidence = word_logprobs.mean().exp().item() + else: + word_confidence = 0 + word.update({"confidence": round_confidence(word_confidence)}) + + words.append(word) + + if verbose: + print_timestamped(word) + + if last_token_check is not None: + segment_tokens_check.append(last_token_check) + if trust_whisper_timestamps: + if segment_tokens_check != segment["tokens"]: + assert len(segment_tokens_check) < len(segment["tokens"]) and segment_tokens_check[:-1] == segment["tokens"][:len(segment_tokens_check)-1], \ + f"Got inconsistent tokens: {tokenizer.decode(segment_tokens_check)} != {tokenizer.decode(segment['tokens'])}" + segment["tokens"] = segment_tokens_check + segment["text"] = tokenizer.decode(segment["tokens"]) + # else: TODO + + if len(segment_logprobs): + segment.update({"confidence": round_confidence(torch.cat(segment_logprobs).mean().exp().item())}) + + if len(ws): + previous_end = ws[-1]["end"] + + if not trust_whisper_timestamps: + current_tokens = [] + token_to_idx_segment = [] + + finally: + + # Remove hooks + for hook in all_hooks: + hook.remove() + + if language_probs: + transcription["language_probs"] = language_probs + + return (transcription, words) + +def get_audio_tensor(audio, device="cpu"): + if isinstance(audio, str): + audio = whisper.load_audio(audio) + if isinstance(audio, np.ndarray): + audio = torch.Tensor(audio) + else: + assert isinstance(audio, torch.Tensor), f"Got unexpected audio of type {type(audio)}" + return audio.to(device) + +def audio_minimum_padding(audio): + if audio.shape[-1] <= 200: + return whisper.pad_or_trim(audio, 201) + return audio + + +def should_use_space(language): + return norm_language(language) not in ["zh", 
"ja", "th", "lo", "my", "yue"] + +def norm_language(language): + if language is None: + return "en" + return whisper.tokenizer.TO_LANGUAGE_CODE.get(language.lower(), language) + +def print_timestamped(w): + line = f"[{format_timestamp(w['start'])} --> {format_timestamp(w['end'])}] {w['text']}\n" + # compared to just `print(line)`, this replaces any character not representable using + # the system default encoding with an '?', avoiding UnicodeEncodeError. + sys.stdout.write(line.encode(sys.getdefaultencoding(), errors="replace").decode()) + sys.stdout.flush() + + +def get_logit_filters(model, whisper_options, prompt = None): + decoding_options = get_decoding_options(whisper_options) + if "initial_prompt" in decoding_options: + prompt0 = decoding_options.pop("initial_prompt") + if prompt is None: + prompt = prompt0 + if prompt is not None: + decoding_options["prompt"] = prompt + decoding_options = whisper.DecodingOptions( + without_timestamps=False, + max_initial_timestamp=1.0, + prefix=None, + suppress_blank=True, + **decoding_options + ) + + # This performs some checks on the options + decoding_task = whisper.decoding.DecodingTask(model, decoding_options) + return decoding_task.logit_filters + +def get_decoding_options(whisper_options): + return dict([(k,v) for (k,v) in whisper_options.items() + if k not in [ + "no_speech_threshold", + "logprob_threshold", + "compression_ratio_threshold", + "condition_on_previous_text", + "verbose", + ] + ]) + +def get_tokenizer(model, task="transcribe", language="en"): + try: + return whisper.tokenizer.get_tokenizer( + model.is_multilingual, + num_languages=model.num_languages if hasattr(model, "num_languages") else 99, + task=task, language=language + ) + except TypeError: # Old openai-whisper version + return whisper.tokenizer.get_tokenizer( + model.is_multilingual, + task=task, language=language + ) + +def perform_word_alignment( + tokens, + attention_weights, + tokenizer, + use_space=True, + mfcc=None, + 
refine_whisper_precision_nframes=0, + remove_punctuation_from_words=False, + include_punctuation_in_timing=False, # Was True before 1.9 + unfinished_decoding=False, + alignment_heads=None, + medfilt_width=9, + qk_scale=1.0, + detect_disfluencies=True, + subwords_can_be_empty=True, # Was False before 1.11 + plot=False, + debug=False, +): + """ + Perform word alignment on the given tokens and attention weights. + Returns a list of (word, start_time, end_time) tuples. + + tokens: list of tokens (integers) + attention_weights: list of attention weights (torch tensors) + tokenizer: tokenizer used to tokenize the text + use_space: whether to use spaces to split the tokens into words (should be true for all languages except Japanese, Chinese, ...) + mfcc: MFCC features (used to identify padded region, and for plotting) + refine_whisper_precision_nframes: precision time + remove_punctuation_from_words: whether to remove punctuation from words + include_punctuation_in_timing: whether to include punctuation in the timing of (previous) words + unfinished_decoding: whether the decoding is unfinished (e.g. 
because the model is stuck) + alignment_heads: list of attention heads to use for alignment + medfilt_width: width of the median filter used to smooth the attention weights + qk_scale: scale factor applied to the attention weights + plot: whether to plot the word alignment + debug: whether to print debug information + """ + + assert len(tokens) > 1, f"Got unexpected sequence of tokens of length {len(tokens)} {tokenizer.decode_with_timestamps(tokens)}" + start_token = tokens[0] - tokenizer.timestamp_begin + end_token = tokens[-1] - tokenizer.timestamp_begin + + # Check start / end tokens + if start_token < 0: + raise RuntimeError(f"Missing start token in: {tokenizer.decode_with_timestamps(tokens)}") + if len(tokens) == 1 or end_token < 0: + # This can happens when Whisper is stucked as a Language Model + if debug: + logger.debug(f"Missing end token in {tokenizer.decode_with_timestamps(tokens)}") + end_token = N_FRAMES // 2 + if end_token == start_token and refine_whisper_precision_nframes == 0: + if debug: + logger.debug(f"Got empty segment in {tokenizer.decode_with_timestamps(tokens)}") + return [] + + # Let a minimal duration given the number of tokens (see https://github.com/linto-ai/whisper-timestamped/issues/67) + end_token = min(N_FRAMES // 2, max(end_token, start_token + len(tokens))) + + # Put some margin around the segment + if refine_whisper_precision_nframes > 0: + start_token = max(start_token - refine_whisper_precision_nframes, 0) + end_token = min(end_token + refine_whisper_precision_nframes, N_FRAMES // 2) + + if end_token <= start_token: + raise RuntimeError(f"Got segment with null or negative duration {tokenizer.decode_with_timestamps(tokens)}: {start_token} {end_token}") + + start_time = start_token * AUDIO_TIME_PER_TOKEN + # end_time = end_token * AUDIO_TIME_PER_TOKEN + + split_tokens = split_tokens_on_spaces if use_space else split_tokens_on_unicode + words, word_tokens, word_tokens_indices = split_tokens(tokens, tokenizer, 
remove_punctuation_from_words=remove_punctuation_from_words) + + # If the last token is a punctuation that comes after a word + # group this final punctuation with the final timestamp + # This is to avoid assigning the final punctuation to a big silence or a noise/music background coming after + num_punctuations_per_tokens = [ + 0 if len(w) == 1 or w[-1] not in _punctuation else 1 + for w in word_tokens + ] + if include_punctuation_in_timing: + num_punctuations_per_tokens[:-2]=[0]*(len(num_punctuations_per_tokens)-2) + + for i, w in enumerate(attention_weights): + assert w.shape[-2] == len(tokens), f"Attention weights have wrong shape: {w.shape[-2]} (expected {len(tokens)})." + weights = torch.cat(attention_weights) # layers * heads * tokens * frames + + num_tokens = weights.shape[-2] + num_frames = end_token - start_token + if num_tokens > num_frames: + logger.warning(f"Too much text ({num_tokens} tokens) for the given number of frames ({num_frames}) in: {tokenizer.decode_with_timestamps(tokens)}\nThe end of the text will be removed.") + return perform_word_alignment( + tokens[:num_frames-1] + [tokens[-1]], + [torch.cat([w[:, :, :num_frames-1, :], w[:, :, -1:, :]], dim=-2) + for w in attention_weights], + tokenizer, + use_space=use_space, + refine_whisper_precision_nframes=refine_whisper_precision_nframes, + medfilt_width=medfilt_width, + qk_scale=qk_scale, + alignment_heads=alignment_heads, + mfcc=mfcc, + plot=plot, + remove_punctuation_from_words=remove_punctuation_from_words, + detect_disfluencies=detect_disfluencies, + subwords_can_be_empty=subwords_can_be_empty, + unfinished_decoding=True, + debug=debug, + ) + + assert end_token <= weights.shape[-1] + assert len(tokens) == num_tokens + + weights = weights[..., start_token: end_token].cpu() # layers * heads * tokens * frames + + if alignment_heads is None: + weights = weights.reshape(-1, *weights.shape[-2:]) # N * tokens * frames + else: + weights = torch.stack([weights[l][h] for l, h in 
alignment_heads.indices().T]) + weights = median_filter(weights, (1, 1, medfilt_width)) + weights = torch.tensor(weights * qk_scale).softmax(dim=-1) + weights = weights.mean(axis=(0)) # average over layers and heads # tokens * frames + weights = weights / weights.norm(dim=-2, keepdim=True) # This was before the mean before 1.9 + weights = -weights.double().numpy() + worse_weight = 0 + + # Get the limit of audio duration + max_duration = None + if mfcc is not None: + max_duration = find_start_padding(mfcc) + if max_duration is not None: + max_duration = max_duration // 2 + + # Enforce the max duration + if max_duration: + if start_token >= max_duration: + logger.warning(f"Got start time outside of audio boundary") + else: + weights[:-1, max_duration:] = worse_weight + + # Encourage to start early + weights[0, 0] = weights.min() + # weights[0, refine_whisper_precision_nframes*2:] = worse_weight + + if subwords_can_be_empty: + step_pattern = dtw.stepPattern.symmetric1 + else: + # Similar as "symmetric1" but without the possibility to have the same timestamp for two tokens + step_pattern = dtw.stepPattern.StepPattern(dtw.stepPattern._c( + 1, 1, 1, -1, + 1, 0, 0, 1, + 2, 0, 1, -1, + 2, 0, 0, 1, + )) + alignment = dtw.dtw(weights, step_pattern=step_pattern) + + global num_alignment_for_plot + num_alignment_for_plot += 1 + + if plot: + import matplotlib.pyplot as plt + import matplotlib.ticker as ticker + + plot_mfcc = 1 if mfcc is not None else 0 + plot_disfluencies = 1 if detect_disfluencies else 0 + nplots = (1 + plot_mfcc + plot_disfluencies) + + plt.subplots(nplots, 1, figsize=(16, 9), gridspec_kw={'height_ratios': [3] + [1] * (nplots - 1)}) + plt.subplot(nplots, 1, 1, frameon=False) + + plt.imshow(-weights, aspect="auto") + plt.plot(alignment.index2s, alignment.index1s, color="red") + + xticks = np.arange(0, weights.shape[1], 1 / AUDIO_TIME_PER_TOKEN) + xticklabels = [round_timestamp(x) for x in xticks * AUDIO_TIME_PER_TOKEN + start_time] + + ylims = 
plt.gca().get_ylim() + + ax = plt.gca() + ax.tick_params('both', length=0, width=0, which='minor', pad=6) + + ax.yaxis.set_ticks_position("left") + ax.yaxis.set_label_position("left") + ax.invert_yaxis() + ax.set_ylim(ylims) + + major_ticks = [-0.5] + minor_ticks = [] + current_y = 0 + + for word, word_token in zip(words, word_tokens): + minor_ticks.append(current_y + len(word_token) / 2 - 0.5) + current_y += len(word_token) + major_ticks.append(current_y - 0.5) + + words_with_subwords = ["|".join(s).strip() for (w, s) in zip(words, word_tokens)] + + ax.yaxis.set_minor_locator(ticker.FixedLocator(minor_ticks)) + ax.yaxis.set_minor_formatter( + ticker.FixedFormatter(words_with_subwords)) + ax.set_yticks(major_ticks) + ax.yaxis.set_major_formatter(ticker.NullFormatter()) + for y in major_ticks: + plt.axhline(y, color="black", linestyle="dashed") + + plt.ylabel("Words") + + if plot_mfcc: + plt.xticks(xticks) + plt.setp(plt.gca().get_xticklabels(), visible=False) + + xticks *= 2 + + plt.subplot(nplots, 1, 2, frameon=False) + plt.imshow(mfcc[0, :, start_token * 2: end_token * 2].cpu(), aspect="auto", origin="lower") + plt.yticks([]) + plt.ylabel("MFCC") + + plt.xticks(xticks, xticklabels) + plt.xlabel("Time (s)") + + jumps = np.diff(alignment.index1s) + jumps = np.pad(jumps, (1, 0), constant_values=1) + jumps = jumps.astype(bool) + jumps = alignment.index2s[jumps] + jumps = np.pad(jumps, (0, 1), constant_values=alignment.index2s[-1]) + + jumps_start = jumps + disfluences = {} + if detect_disfluencies: + jumps_start = copy.copy(jumps) + + for (i_token, (tok, begin, end)) in enumerate(zip(tokens, jumps[:-1], jumps[1:])): + + # Find local maxima in the portion of attention weights + attention_weights = -weights[i_token, begin:end] + peaks, properties = find_peaks(attention_weights, + width=3, + prominence=0.02, + ) + # If more than + if len(peaks) > 1: + if "left_ips" in properties: + left = [round(x) for x in properties["left_ips"]] + else: + left = 
properties["left_bases"] + + new_begin = left[-1] + begin + + jumps_start[i_token] = new_begin + + if new_begin != begin: + is_punctuation = tokenizer.decode_with_timestamps([tok]) in _punctuation + if not is_punctuation: + disfluences[i_token] = (begin, jumps_start[i_token]) + else: + disfluences[i_token+1] = (begin, end) + + if plot: + plt.subplot(nplots, 1, 2 + plot_mfcc, frameon=False) + plt.plot(range(begin,end), attention_weights) + plt.xlim(0, end) + + for i, p in enumerate(peaks): + color = 'red' if (len(peaks)>1 and i1 else 'green' + barxxy(begin+properties["left_bases"], begin+properties["right_bases"], properties.get("prominences",[1]*len(properties["left_bases"])), alpha=0.5, + # put a line with a custom color + linewidth=1, edgecolor=color + ) + if "left_ips" in properties: + for left in properties["left_ips"]: + plt.vlines(begin+left, 0, 0.5, color='green', linestyle=':') + for right in properties["right_ips"]: + plt.vlines(begin+right, 0, 0.5, color='red', linestyle=':') + + + # display the word-level timestamps in a table + word_boundaries = np.cumsum([len(t) for t in word_tokens]) + word_boundaries = np.pad(word_boundaries, (1, 0)) + begin_times = jumps_start[word_boundaries[:-1]] + end_times = jumps[word_boundaries[1:] - num_punctuations_per_tokens] + + begin_times = begin_times * AUDIO_TIME_PER_TOKEN + end_times = end_times * AUDIO_TIME_PER_TOKEN + + if detect_disfluencies: + to_be_added = [] + i_start = 0 + for i_word, toks in enumerate(word_tokens[:-1]): + i_end = i_start + len(toks) + if i_start in disfluences and i_word > 0: + begin, end = disfluences[i_start] + begin *= AUDIO_TIME_PER_TOKEN + end *= AUDIO_TIME_PER_TOKEN + to_be_added.append((i_word, begin, end)) + i_start = i_end + # Add from the end to avoid messing up the indices + for (i_word, begin, end) in to_be_added[-1::-1]: + words.insert(i_word, DISFLUENCY_MARK) + word_tokens.insert(i_word, []) + word_tokens_indices.insert(i_word, []) + begin_times = np.insert(begin_times, i_word, 
begin) + end_times = np.insert(end_times, i_word, end) + + # Ignore start / end tokens + if not refine_whisper_precision_nframes: + begin_times[1] = begin_times[0] + if not refine_whisper_precision_nframes: + end_times[-2] = end_times[-1] + if unfinished_decoding: + words = words[1:] + word_tokens = word_tokens[1:] + word_tokens_indices = word_tokens_indices[1:] + begin_times = begin_times[1:] + end_times = end_times[1:] + else: + words = words[1:-1] + word_tokens = word_tokens[1:-1] + word_tokens_indices = word_tokens_indices[1:-1] + begin_times = begin_times[1:-1] + end_times = end_times[1:-1] + + if plot: + ymin = 1 + + plt.subplot(nplots, 1, 1) + for i, (w, ws, begin, end) in enumerate(zip(words, word_tokens, begin_times, end_times)): + ymax = ymin + len(ws) + if mfcc is None: + plt.text(begin / AUDIO_TIME_PER_TOKEN, num_tokens-0.5, w, ha="left", va="top", color="red") + for x in [begin, end,]: + plt.axvline(x / AUDIO_TIME_PER_TOKEN, color="red", linestyle="dotted", + ymin=1-ymin/num_tokens, + ymax=0, # 1-ymax/num_tokens, + ) + ymin = ymax + + if plot_mfcc: + plt.subplot(nplots, 1, 2) + for i, (w, begin, end) in enumerate(zip(words, begin_times, end_times)): + plt.text(begin * 2 / AUDIO_TIME_PER_TOKEN, mfcc.shape[-2]*1.05, w, ha="left", va="bottom", color="red") + for x in [begin, end,]: + plt.axvline(x * 2 / AUDIO_TIME_PER_TOKEN, color="red", linestyle="dotted") + + if isinstance(plot, str): + plt.savefig(f"{plot}.alignment{num_alignment_for_plot:03d}.jpg", bbox_inches='tight', pad_inches=0) + else: + plt.show() + + return [ + dict( + text=word, + start=round_timestamp(begin + start_time), + end=round_timestamp(end + start_time), + tokens=tokens, + tokens_indices=tokens_indices, + ) + for word, begin, end, tokens, tokens_indices in zip(words, begin_times, end_times, word_tokens, word_tokens_indices) + if not word.startswith("<|") + ] + +def find_start_padding(mfcc): + """ Return start of padding given the mfcc, or None if there is no padding """ + last_mfcc = 
# Characters treated as punctuation when gluing tokens to the previous word.
# "-" and "'" are excluded from string.punctuation because they occur inside words.
_punctuation = "".join(c for c in string.punctuation if c not in ["-", "'"]) + "。,!?:”、…"

def split_tokens_on_unicode(tokens: list, tokenizer, remove_punctuation_from_words=False, isolate_punctuations=False):
    """
    Group token ids into the smallest units that decode to valid text.

    Tokens are accumulated until their decoding no longer contains the Unicode
    replacement character U+FFFD (presumably a character split across several
    tokens -- confirm against the tokenizer). A unit made only of punctuation
    is appended to the previous unit, unless `isolate_punctuations` is set or
    the previous unit ends with a timestamp token.

    parameters:
        tokens: list
            token ids to split
        tokenizer:
            object providing `decode_with_timestamps`, `eot` and `timestamp_begin`
        remove_punctuation_from_words: bool
            if True, glued punctuation is kept in the token lists but not added to the word text
        isolate_punctuations: bool
            if True, punctuation is never glued to the previous unit

    returns:
        (words, word_tokens, word_tokens_indices):
            the text of each unit, the decoded pieces of each unit (with "" as
            placeholder for tokens that only decode together with the next ones),
            and the token ids of each unit
    """
    words = []
    word_tokens = []
    word_tokens_indices = []
    current_tokens = []

    for token in tokens:
        current_tokens.append(token)
        # Tokens in [eot, timestamp_begin) are left out of the decoding
        decodable = [t for t in current_tokens if t < tokenizer.eot or t >= tokenizer.timestamp_begin]
        decoded = tokenizer.decode_with_timestamps(decodable)
        if "\ufffd" in decoded:
            # Not decodable yet: keep accumulating tokens
            continue

        empty_tokens = [""] * (len(current_tokens) - 1)
        stripped = decoded.strip()
        punctuation = not isolate_punctuations and (stripped and stripped in _punctuation)
        previous_special = len(word_tokens_indices) > 0 and (word_tokens_indices[-1][-1] >= tokenizer.timestamp_begin)
        if punctuation and not previous_special:
            if len(words) == 0:
                # Punctuation comes first: open an empty unit to attach it to.
                # All three lists must be initialized together, otherwise
                # word_tokens_indices[-1] below raises an IndexError.
                words = [""]
                word_tokens = [[]]
                word_tokens_indices = [[]]
            if not remove_punctuation_from_words:
                words[-1] += decoded
            word_tokens[-1].extend(empty_tokens + [decoded])
            word_tokens_indices[-1].extend(current_tokens)
        else:
            words.append(decoded)
            word_tokens.append(empty_tokens + [decoded])
            word_tokens_indices.append(current_tokens)
        current_tokens = []

    return words, word_tokens, word_tokens_indices
def check_vad_method(method, with_version=False):
    """
    Validate a VAD method specification.

    parameters:
        method: bool or str
            True / "True" / "true" (use the default method, silero),
            False / "False" / "false" (no VAD),
            "silero", "silero:<version>" (ex: "silero:3.1" or "silero:v3.1"),
            or "auditok"
        with_version: bool
            if True, silero methods are returned as a tuple ("silero", version),
            where version is None or a string starting with "v"

    returns:
        False if VAD is disabled, ("silero", version) for silero methods when
        `with_version` is set, and the method string otherwise

    raises:
        ValueError: if the method or the silero version is not recognized
        ImportError: if "auditok" is requested but the package cannot be imported
    """
    if method in [True, "True", "true"]:
        # Default method. with_version is forwarded so that the caller gets
        # the ("silero", version) tuple it asked for.
        return check_vad_method("silero", with_version)
    if method in [False, "False", "false"]:
        return False
    if not isinstance(method, str):
        raise ValueError(f"Got unexpected VAD method {method}")

    if method.startswith("silero"):
        version = None
        if method != "silero":
            # Explicit check rather than an assert, which is stripped under "python -O"
            if not method.startswith("silero:"):
                raise ValueError(f"Got unexpected VAD method {method}")
            version = method.split(":")[1]
            if not version.startswith("v"):
                version = "v" + version
            try:
                is_valid = float(version[1:]) >= 1
            except ValueError:
                is_valid = False
            if not is_valid:
                raise ValueError(f"Got unexpected silero version {version} (please check https://github.com/snakers4/silero-vad/wiki/Version-history-and-Available-Models)")
        if with_version:
            return ("silero", version)
        return method

    if method == "auditok":
        try:
            import auditok  # noqa: F401 (only checking that the package is available)
        except ImportError as err:
            raise ImportError("Please install auditok to use the auditok VAD (or use another VAD method)") from err
        return method

    raise ValueError(f"Got unexpected VAD method {method}")
+ _has_onnx = True + except ImportError as err: + logger.warning(f"Please install onnxruntime to use more efficiently silero VAD") + _has_onnx = False + onnx=False + else: + onnx=False + + # Choose silero version because of problems with version 4, see https://github.com/linto-ai/whisper-timestamped/issues/74 + repo_or_dir_master = os.path.expanduser("~/.cache/torch/hub/snakers4_silero-vad_master") + repo_or_dir_specific = os.path.expanduser(f"~/.cache/torch/hub/snakers4_silero-vad_{version}") if version else repo_or_dir_master + repo_or_dir = repo_or_dir_specific + tmp_folder = None + def apply_folder_hack(): + nonlocal tmp_folder + if os.path.exists(repo_or_dir_master): + tmp_folder = repo_or_dir_master + ".tmp" + shutil.move(repo_or_dir_master, tmp_folder) + # Make a symlink to the v3.1 model, otherwise it fails + input_exists = os.path.exists(repo_or_dir_specific) + if not input_exists: + # Make dummy file for the symlink to work + os.makedirs(repo_or_dir_specific, exist_ok=True) + os.symlink(repo_or_dir_specific, repo_or_dir_master) + if not input_exists: + shutil.rmtree(repo_or_dir_specific) + + source = "local" + if not os.path.exists(repo_or_dir): + # Load specific version of silero + repo_or_dir = f"snakers4/silero-vad:{version}" if version else "snakers4/silero-vad" + source = "github" + if need_folder_hack: + apply_folder_hack() + try: + _silero_vad_model, utils = torch.hub.load(repo_or_dir=repo_or_dir, model="silero_vad", onnx=onnx, source=source) + except ImportError as err: + raise RuntimeError(f"Please install what is needed to use the silero VAD (or use another VAD method)") from err + except Exception as err: + raise RuntimeError(f"Problem when installing silero with version {version}. 
Check versions here: https://github.com/snakers4/silero-vad/wiki/Version-history-and-Available-Models") from err + finally: + if need_folder_hack: + if os.path.exists(repo_or_dir_master): + os.remove(repo_or_dir_master) + if tmp_folder: + shutil.move(tmp_folder, repo_or_dir_master) + assert os.path.isdir(repo_or_dir_specific), f"Unexpected situation: missing {repo_or_dir_specific}" + + _silero_get_speech_ts = utils[0] + + # Cheap normalization of the volume + audio = audio / max(0.1, audio.abs().max()) + + segments = _silero_get_speech_ts(audio, _silero_vad_model, + min_speech_duration_ms = round(min_speech_duration * 1000), + min_silence_duration_ms = round(min_silence_duration * 1000), + return_seconds = False, + ) + + elif method == "auditok": + import auditok + + # Cheap normalization of the volume + audio = audio / max(0.1, audio.abs().max()) + + data = (audio.numpy() * 32767).astype(np.int16).tobytes() + + segments = auditok.split( + data, + sampling_rate=SAMPLE_RATE, # sampling frequency in Hz + channels=1, # number of channels + sample_width=2, # number of bytes per sample + min_dur=min_speech_duration, # minimum duration of a valid audio event in seconds + max_dur=len(audio)/SAMPLE_RATE, # maximum duration of an event + max_silence=min_silence_duration, # maximum duration of tolerated continuous silence within an event + energy_threshold=50, + drop_trailing_silence=True, + ) + + segments = [{"start": s._meta.start * SAMPLE_RATE, "end": s._meta.end * SAMPLE_RATE} for s in segments] + + else: + raise ValueError(f"Got unexpected VAD method {method}") + + if dilatation > 0: + dilatation = round(dilatation * SAMPLE_RATE) + new_segments = [] + for seg in segments: + new_seg = { + "start": max(0, seg["start"] - dilatation), + "end": min(len(audio), seg["end"] + dilatation) + } + if len(new_segments) > 0 and new_segments[-1]["end"] >= new_seg["start"]: + new_segments[-1]["end"] = new_seg["end"] + else: + new_segments.append(new_seg) + segments = new_segments + + 
ratio = 1 if output_sample else 1 / SAMPLE_RATE + + if ratio != 1: + for seg in segments: + seg["start"] *= ratio + seg["end"] *= ratio + if output_sample: + for seg in segments: + seg["start"] = round(seg["start"]) + seg["end"] = round(seg["end"]) + return segments + +def remove_non_speech(audio, + use_sample=False, + min_speech_duration=0.1, + min_silence_duration=1, + method="silero", + plot=False, + ): + """ + Remove non-speech segments from audio (using Silero VAD), + glue the speech segments together and return the result along with + a function to convert timestamps from the new audio to the original audio + + parameters: + audio: torch.Tensor + audio data *in 16kHz* + use_sample: bool + if True, return start and end in samples instead of seconds + min_speech_duration: float + minimum duration (in sec) of a speech segment + min_silence_duration: float + minimum duration (in sec) of a silence segment + method: str + method to use to remove non-speech segments + plot: bool or str + if True, plot the result. 
def do_convert_timestamps(segments, t, t2 = None):
    """
    Map a timestamp of the trimmed audio (kept segments glued together) back to the original audio

    parameters:
        segments: list of tuple (start, end), positions in the original audio of the
            segments that were kept and concatenated, in increasing order
        t: timestamp to convert
        t2: second timestamp to convert (optional), when the two timestamps should be in the same segment

    returns:
        the converted timestamp rounded to 2 decimals if t2 is None,
        otherwise the list of the two converted timestamps
    """
    assert len(segments)
    has_second = t2 is not None

    shift = 0        # what to add to a trimmed-audio position to get the original position
    trimmed_end = 0  # end of the current segment, in the trimmed audio
    last_end = 0     # end of the previous segment, in the original audio
    candidates = []
    for seg_start, seg_end in segments:
        trimmed_end += seg_end - seg_start
        shift += seg_start - last_end
        last_end = seg_end

        first_inside = t <= trimmed_end
        second_inside = (t2 <= trimmed_end) if has_second else first_inside
        if not (first_inside or second_inside):
            continue

        # Converted positions are clamped to the current segment
        mapped_first = max(seg_start, min(seg_end, shift + t))
        mapped_second = max(seg_start, min(seg_end, shift + t2)) if has_second else None
        candidates.append([mapped_first, mapped_second])
        if first_inside and second_inside:
            break

    if not candidates:
        # Timestamp(s) after the last segment: only apply the last shift
        candidates.append([shift + t, shift + t2 if has_second else None])

    if len(candidates) > 1:
        # The two timestamps fall in different segments:
        # keep the candidate whose duration is the closest to the input duration
        target = abs(t2 - t)
        candidates.sort(key=lambda pair: abs(target - abs(pair[1] - pair[0])))

    best = candidates[0]
    if not has_second:
        return round(best[0], 2)
    return [round(value, 2) for value in best]
def remove_keys(list_of_dicts, key):
    """
    Yield a shallow copy of each dictionary without the given key.

    The input dictionaries are not modified, and the remaining keys keep
    their original insertion order (a set difference on `d.keys()` would
    make the order arbitrary).

    parameters:
        list_of_dicts: iterable of dict
        key: key to leave out (dictionaries that do not have it are copied as is)
    """
    for d in list_of_dicts:
        yield {k: v for k, v in d.items() if k != key}
def get_default_device():
    """
    Return the name of the device to use by default:
    "cuda" if torch reports CUDA as available,
    otherwise "xpu" if the torch.xpu module can be found and reports itself available,
    otherwise "cpu"
    """
    if torch.cuda.is_available():
        return "cuda"
    # torch.xpu may be missing from the installed torch, hence the find_spec guard
    has_xpu_module = find_spec('torch.xpu') is not None
    if has_xpu_module and torch.xpu.is_available():
        return "xpu"
    return "cpu"
def get_alignment_heads(model, max_top_layer=3):
    """
    Return the alignment heads of a Whisper model.

    If the model has an "alignment_heads" attribute (Whisper since version 20230306),
    it is returned as is. Otherwise the model name is looked up from the number
    of parameters, and the heads are decoded from the corresponding dump.

    returns:
        the alignment heads, or None (with a warning) when the number of
        parameters does not match any known model

    note: max_top_layer is not used here
    """
    if hasattr(model, "alignment_heads"):
        return model.alignment_heads

    parameter_count = _get_number_of_parameters(model)
    dims = model.dims
    layer_count, head_count = dims.n_text_layer, dims.n_text_head

    name = _PARAMETERS_TO_MODEL_NAME.get(parameter_count)
    if name is None:
        logger.warning("Could not retrieve alignment heads : taking all attention heads from the top layers")
        return None

    if name == "large":
        # "large" covers both v1 and v2 (same number of parameters):
        # they are told apart by the sign of the first value of the first parameter
        first_value = next(model.parameters())[0,0,0]
        name = "large-v1" if first_value > 0 else "large-v2"

    return _get_alignment_heads(name, layer_count, head_count)
load_model( + name: str, + device: Optional[Union[str, torch.device]] = None, + download_root: str = None, + in_memory: bool = False, +): + extension = os.path.splitext(name)[-1] if os.path.isfile(name) else None + + if name in whisper.available_models() or extension == ".pt": + return whisper.load_model(name, device=device, download_root=download_root, in_memory=in_memory) + + # Otherwise, assume transformers + if extension in [".ckpt", ".bin"]: + model_path = name + else: + # Search for the cached file (download if necessary) + try: + import transformers + except ImportError: + raise ImportError(f"If you are trying to download a HuggingFace model with {name}, please install first the transformers library") + from transformers.utils import cached_file + + try: + model_path = cached_file(name, "pytorch_model.bin", cache_dir=download_root, use_auth_token=None, revision=None) + except Exception as e: + try: + if isinstance(e, OSError): + model_path = cached_file(name, "whisper.ckpt", cache_dir=download_root, use_auth_token=None, revision=None) + else: + raise e + except: + raise RuntimeError(f"Original error: {e}\nCould not find model {name} from HuggingFace nor local folders.") + # Load HF Model + hf_state_dict = torch.load(model_path, map_location="cpu") + + # Rename layers + for key in list(hf_state_dict.keys())[:]: + new_key = hf_to_whisper_states(key) + if new_key is None: + hf_state_dict.pop(key) + elif new_key != key: + hf_state_dict[new_key] = hf_state_dict.pop(key) + + + # Init Whisper Model and replace model weights + dims = whisper.model.ModelDimensions(**states_to_dim(hf_state_dict)) + + if "proj_out.weight" in hf_state_dict: + hf_state_dict["decoder.proj_out.weight"] = hf_state_dict.pop("proj_out.weight") + logger.warning("Using untied projection layer") + whisper_model = WhisperUntied(dims) + else: + whisper_model = whisper.model.Whisper(dims) + + whisper_model.load_state_dict(hf_state_dict) + del hf_state_dict + if hasattr(whisper_model, 
# Substitutions applied, in this order, to rename HuggingFace keys into Whisper keys.
# The patterns are regular expressions in which "." is deliberately left unescaped:
# it matches any character, and some rules rely on it (ex: ".self_attn." also matches
# ".self_attn_" in "self_attn_layer_norm", which a later rule then turns into "attn_ln").
_HF_TO_WHISPER_SUBSTITUTIONS = (
    (r'.layers.', '.blocks.'),
    (r'.self_attn.', '.attn.'),
    (r'.q_proj.', '.query.'),
    (r'.k_proj.', '.key.'),
    (r'.v_proj.', '.value.'),
    (r'.out_proj.', '.out.'),
    (r'.fc1.', '.mlp.0.'),
    (r'.fc2.', '.mlp.2.'),
    (r'.fc3.', '.mlp.3.'),
    (r'.encoder_attn.', '.cross_attn.'),
    (r'.cross_attn.ln.', '.cross_attn_ln.'),
    (r'.embed_positions.weight', '.positional_embedding'),
    (r'.embed_tokens.', '.token_embedding.'),
    (r'model.', ''),
    (r'attn.layer_norm.', 'attn_ln.'),
    (r'.final_layer_norm.', '.mlp_ln.'),
    (r'encoder.layer_norm.', 'encoder.ln_post.'),
    (r'decoder.layer_norm.', 'decoder.ln.'),
)

# Credit: https://github.com/openai/whisper/discussions/830
def hf_to_whisper_states(text):
    """
    Convert the name of a HuggingFace state dict entry into the Whisper name.

    parameters:
        text: str
            key of the HuggingFace state dict

    returns:
        the corresponding Whisper key, or None if the entry has to be dropped
        ("_mel_filters", and any key containing "default")
    """
    # From Speechbrain
    if text == "_mel_filters":
        return None

    # From PEFT
    if "default" in text:
        return None
    if text.startswith("base_model.model."):
        text = text[len("base_model.model."):]

    for pattern, replacement in _HF_TO_WHISPER_SUBSTITUTIONS:
        text = re.sub(pattern, replacement, text)
    return text
class TextDecoderUntied(whisper.model.TextDecoder):
    """
    Same as TextDecoder but with untied weights:
    the logits are computed with a dedicated linear layer (proj_out)
    """
    def __init__(self, *args, **kwargs):
        import torch
        super().__init__(*args, **kwargs)

        # The projection has the shape of the token embedding matrix (no bias)
        vocab_size, state_size = self.token_embedding.weight.shape
        self.proj_out = torch.nn.Linear(state_size, vocab_size, bias=False)

    def forward(self, x, xa, kv_cache = None):
        # Positions already covered by the cache are skipped
        if kv_cache:
            offset = next(iter(kv_cache.values())).shape[1]
        else:
            offset = 0

        positions = self.positional_embedding[offset : offset + x.shape[-1]]
        hidden = (self.token_embedding(x) + positions).to(xa.dtype)

        for block in self.blocks:
            hidden = block(hidden, xa, mask=self.mask, kv_cache=kv_cache)
        hidden = self.ln(hidden)

        # The projection layer is cast to the dtype of the activations before being applied
        projection = self.proj_out.to(hidden.dtype)
        return projection(hidden).float()
text_first=False, format_timestamps=lambda x: round(1000 * x)) + + except ImportError: + # New whisper version + from whisper.utils import get_writer + + def do_write(transcript, file, output_format): + writer = get_writer(output_format, os.path.curdir) + try: + return writer.write_result({"segments": transcript}, file) + except TypeError: + # Version > 20230314 + return writer.write_result({"segments": list(transcript)}, file, { + "highlight_words": False, + "max_line_width": None, + "max_line_count": None, + }) + def get_do_write(output_format): + return lambda transcript, file: do_write(transcript, file, output_format) + + write_txt = get_do_write("txt") + write_srt = get_do_write("srt") + write_vtt = get_do_write("vtt") + write_tsv = get_do_write("tsv") + + parser = argparse.ArgumentParser( + description='Transcribe a single audio with whisper and compute word timestamps', + formatter_class=argparse.ArgumentDefaultsHelpFormatter + ) + parser.add_argument('-v', '--version', help="show version and exit", action='version', version=f'{__version__}') + parser.add_argument('--versions', help="show versions (of whisper-timestamped and whisper) and exit", action='version', + version=f'{__version__} -- Whisper {whisper.__version__} in {os.path.realpath(os.path.dirname(whisper.__file__))}') + + parser.add_argument('audio', help="audio file(s) to transcribe", nargs='+') + parser.add_argument('--model', help=f"name of the Whisper model to use. 
Examples: {', '.join(whisper.available_models())}", default="small") + parser.add_argument("--model_dir", default=None, help="the path to save model files; uses ~/.cache/whisper by default", type=str) + parser.add_argument("--device", default=get_default_device(), help="device to use for PyTorch inference") + parser.add_argument("--output_dir", "-o", default=None, help="directory to save the outputs", type=str) + valid_formats = ["txt", "vtt", "srt", "tsv", "csv", "json"] + def str2output_formats(string): + if string == "all": + return valid_formats + formats = string.split(",") + for format in formats: + if format not in valid_formats: + raise ValueError(f"Expected one of {valid_formats}, got {format}") + return formats + parser.add_argument("--output_format", "-f", default="all", help=f"Format(s) of the output file(s). Possible formats are: {', '.join(valid_formats)}. Several formats can be specified by using commas (ex: \"json,vtt,srt\"). By default (\"all\"), all available formats will be produced", type=str2output_formats) + + parser.add_argument("--task", default="transcribe", help="whether to perform X->X speech recognition ('transcribe') or X->English translation ('translate')", choices=["transcribe", "translate"], type=str) + parser.add_argument('--language', help=f"language spoken in the audio, specify None to perform language detection.", choices=sorted(whisper.tokenizer.LANGUAGES.keys()) + sorted([k.title() for k in whisper.tokenizer.TO_LANGUAGE_CODE.keys()]), default=None) + # f"{', '.join(sorted(k+'('+v+')' for k,v in whisper.tokenizer.LANGUAGES.items()))} + + parser.add_argument('--vad', default=False, help="whether to run Voice Activity Detection (VAD) to remove non-speech segment before applying Whisper model (removes hallucinations). Can be: True, False, silero, silero:3.1 (or another version), or autitok. 
Some additional libraries might be needed") + parser.add_argument('--detect_disfluencies', default=False, help="whether to try to detect disfluencies, marking them as special words [*]", type=str2bool) + parser.add_argument('--recompute_all_timestamps', default=not TRUST_WHISPER_TIMESTAMP_BY_DEFAULT, help="Do not rely at all on Whisper timestamps (Experimental option: did not bring any improvement, but could be useful in cases where Whipser segment timestamp are wrong by more than 0.5 seconds)", type=str2bool) + parser.add_argument("--punctuations_with_words", default=True, help="whether to include punctuations in the words", type=str2bool) + + parser.add_argument("--temperature", default=0.0, help="temperature to use for sampling", type=float) + parser.add_argument("--best_of", type=optional_int, default=None if USE_EFFICIENT_BY_DEFAULT else 5, help="number of candidates when sampling with non-zero temperature") + parser.add_argument("--beam_size", type=optional_int, default=None if USE_EFFICIENT_BY_DEFAULT else 5, help="number of beams in beam search, only applicable when temperature is zero") + parser.add_argument("--patience", type=float, default=None, help="optional patience value to use in beam decoding, as in https://arxiv.org/abs/2204.05424, the default (1.0) is equivalent to conventional beam search") + parser.add_argument("--length_penalty", type=float, default=None, help="optional token length penalty coefficient (alpha) as in https://arxiv.org/abs/1609.08144, uses simple length normalization by default") + + parser.add_argument("--suppress_tokens", default="-1", help="comma-separated list of token ids to suppress during sampling; '-1' will suppress most special characters except common punctuations", type=str) + parser.add_argument("--initial_prompt", default=None, help="optional text to provide as a prompt for the first window.", type=str) + parser.add_argument("--condition_on_previous_text", default=True, help="if True, provide the previous output of 
the model as a prompt for the next window; disabling may make the text inconsistent across windows, but the model becomes less prone to getting stuck in a failure loop", type=str2bool) + parser.add_argument("--fp16", default=None, help="whether to perform inference in fp16; Automatic by default (True if GPU available, False otherwise)", type=str2bool) + + parser.add_argument("--temperature_increment_on_fallback", default=0.0 if USE_EFFICIENT_BY_DEFAULT else 0.2, help="temperature to increase when falling back when the decoding fails to meet either of the thresholds below", type=optional_float) + parser.add_argument("--compression_ratio_threshold", default=2.4, help="if the gzip compression ratio is higher than this value, treat the decoding as failed", type=optional_float) + parser.add_argument("--logprob_threshold", default=-1.0, help="if the average log probability is lower than this value, treat the decoding as failed", type=optional_float) + parser.add_argument("--no_speech_threshold", default=0.6, help="if the probability of the <|nospeech|> token is higher than this value AND the decoding has failed due to `logprob_threshold`, consider the segment as silence", type=optional_float) + parser.add_argument("--threads", default=0, help="number of threads used by torch for CPU inference; supercedes MKL_NUM_THREADS/OMP_NUM_THREADS", type=optional_int) + + parser.add_argument("--compute_confidence", default=True, help="whether to compute confidence scores for words", type=str2bool) + parser.add_argument("--verbose", type=str2bool, default=False, help="whether to print out the progress and debug messages of Whisper") + parser.add_argument('--plot', help="plot word alignments (save the figures if an --output_dir is specified, otherwhise just show figures that have to be closed to continue)", default=False, action="store_true") + parser.add_argument('--debug', help="print some debug information about word alignement", default=False, action="store_true") + + class 
ActionSetAccurate(argparse.Action): + def __init__(self, option_strings, dest, nargs=None, **kwargs): + assert nargs is None + super().__init__(option_strings, dest, nargs=0, **kwargs) + def __call__(self, parser, namespace, values, option_string=None): + setattr(namespace, "best_of", 5) + setattr(namespace, "beam_size", 5) + setattr(namespace, "temperature_increment_on_fallback", 0.2) + parser.add_argument('--accurate', help="Shortcut to use the same default option as in Whisper (best_of=5, beam_search=5, temperature_increment_on_fallback=0.2)", action=ActionSetAccurate) + + class ActionSetEfficient(argparse.Action): + def __init__(self, option_strings, dest, nargs=None, **kwargs): + assert nargs is None + super().__init__(option_strings, dest, nargs=0, **kwargs) + def __call__(self, parser, namespace, values, option_string=None): + setattr(namespace, "best_of", None) + setattr(namespace, "beam_size", None) + setattr(namespace, "temperature_increment_on_fallback", None) + parser.add_argument('--efficient', help="Shortcut to disable beam size and options that requires to sample several times, for an efficient decoding", action=ActionSetEfficient) + + parser.add_argument('--naive', help="use naive approach, doing inference twice (once to get the transcription, once to get word timestamps and confidence scores).", default=False, action="store_true") + + args = parser.parse_args().__dict__ + args.pop("accurate") + args.pop("efficient") + + temperature = args.pop("temperature") + temperature_increment_on_fallback = args.pop("temperature_increment_on_fallback") + if temperature_increment_on_fallback: + temperature = tuple(np.arange(temperature, 1.0 + 1e-6, temperature_increment_on_fallback)) + else: + temperature = [temperature] + + threads = args.pop("threads") + if threads: + torch.set_num_threads(threads) + + audio_files = args.pop("audio") + + model = args.pop("model") + device = args.pop("device") + model_dir = args.pop("model_dir") + + if 
device.lower().startswith("cuda"): + force_cudnn_initialization(device) + + output_format = args.pop("output_format") + + model = load_model(model, device=device, download_root=model_dir) + + plot_word_alignment = args.pop("plot") + + debug = args.pop("debug") + logging.basicConfig() + if debug: + logger.setLevel(logging.DEBUG) + # This supposes to plug a logger with name "WHISPER" into Whisper source code (no harm if it's not set) + logging.getLogger("WHISPER").setLevel(logging.DEBUG) + + output_dir = args.pop("output_dir") + if output_dir and not os.path.isdir(output_dir): + os.makedirs(output_dir) + + args["naive_approach"] = args.pop("naive") + args["remove_punctuation_from_words"] = not args.pop("punctuations_with_words") + args["compute_word_confidence"] = args.pop("compute_confidence") + args["trust_whisper_timestamps"] = not args.pop("recompute_all_timestamps") + + for audio_path in audio_files: + + outname = os.path.join(output_dir, os.path.basename(audio_path)) if output_dir else None + + result = transcribe_timestamped( + model, audio_path, + temperature=temperature, + plot_word_alignment=outname if (outname and plot_word_alignment) else plot_word_alignment, + **args + ) + + if output_dir: + + if "json" in output_format: + # save JSON + with open(outname + ".words.json", "w", encoding="utf-8") as js: + json.dump(result, js, indent=2, ensure_ascii=False) + + # save TXT + if "txt" in output_format: + with open(outname + ".txt", "w", encoding="utf-8") as txt: + write_txt(result["segments"], file=txt) + + # save VTT + if "vtt" in output_format: + with open(outname + ".vtt", "w", encoding="utf-8") as vtt: + write_vtt(remove_keys(result["segments"], "words"), file=vtt) + with open(outname + ".words.vtt", "w", encoding="utf-8") as vtt: + write_vtt(flatten(result["segments"], "words"), file=vtt) + + # save SRT + if "srt" in output_format: + with open(outname + ".srt", "w", encoding="utf-8") as srt: + write_srt(remove_keys(result["segments"], "words"), file=srt) 
def filtered_keys(result, keys=(
    "text",
    "segments", "words",
    "language",
    "start",
    "end",
    "confidence",
    "language_probs",
)):
    """Return a reduced copy of ``result`` that keeps only whitelisted keys.

    The structure is walked recursively:

    * dict  -> a new dict containing only the entries whose key is in
      ``keys``; each kept value is filtered recursively, except the value
      stored under ``"language_probs"``, which is passed through untouched
      (its inner keys are not in the whitelist and its floats are not rounded).
    * list  -> a new list with every element filtered recursively.
    * float -> the value rounded to 2 decimals.
    * anything else is returned unchanged.

    The input object is never modified.

    Args:
        result: Arbitrary nesting of dicts, lists and scalars.
        keys: Collection of dict keys to keep (anything supporting ``in``).
            The default is an immutable tuple so that no mutable object is
            shared between calls.

    Returns:
        The filtered (and rounded) copy of ``result``.
    """
    if isinstance(result, dict):
        return {
            k: (v if k == "language_probs" else filtered_keys(v, keys))
            for k, v in result.items()
            if k in keys
        }
    if isinstance(result, list):
        return [filtered_keys(v, keys) for v in result]
    if isinstance(result, float):
        return round(result, 2)
    return result