From beeaa74c42936d6701423da56e33f94bb79e87cb Mon Sep 17 00:00:00 2001 From: MerlynTheWizard Date: Thu, 27 Feb 2025 16:21:02 +0000 Subject: [PATCH 1/3] adds splitting audio file cookbook --- .../images/audio-split.png | Bin 0 -> 16969 bytes .../splitting-large-audio-files.mdx | 64 ++++++++++++++++++ mint.json | 5 +- 3 files changed, 68 insertions(+), 1 deletion(-) create mode 100644 guides/transcription/salad-transcription-api/images/audio-split.png create mode 100644 guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx diff --git a/guides/transcription/salad-transcription-api/images/audio-split.png b/guides/transcription/salad-transcription-api/images/audio-split.png new file mode 100644 index 0000000000000000000000000000000000000000..c8acf3edf7c92ec8a83add84c31ec911cae1318b GIT binary patch literal 16969 zcmch8by!sE`Zh7bAP6%wQZpbajdX`}iHdZGNOyO4N|#88sC0LiG|~+c(%tYa_V(*2ne(>7DMu~NO};|{kxP80aD`mzhI=xqc0YgM@k1zK&U8-9khYCKMZ5U^%Kvy+GAB6(h z2sw4L5FWXx?hj)~=si&3MpC_wR@ZatceEvgXYtXnP0@H0UJ3f|vj$~Z|- z>P;7oqv!$;?OqqGJ$vJaIFsR-brgE^CS_e6@z+^e6S2=_^%xRe3pH11k$AJwq#fBPM4H>pyPbcjg7Y zS{T{u!JIA3E$w)n1t|WwgBSRIf0>yA_Qx&uW&#wd@=7olamvZ6FZZYtqC(L4-XGB3mY>V8zXQBqn(STy`D3p zr5)v;M*d|-+{n(r*3{bG)XEZeZ&y#>%E4ZMg5tiRzdnEV)5zKM-z{0%{T>!DK<4`r zW>zK^=D%zMRr&9)@+z4+8=0$#n_3uI+5v3{^04v$ar^%i{JX)wRaE_3MNXE#*Zf<_ zf7g6%XJjj8WdXEkFZj~H)(B|%t(E=n%6~8XU6G&pe&Bzbh(BlfkE_5m3qIs${%gqu zA1as9=OQ2oevuXzdF70_ll~x$^f`7XU$q7dgx*4hhA*`bN(4DIv}s{+V{(I?g2;Av zcd=)E>*`Qxs`*w=b(|_D`1lUjc4qn;J#>CnC7&7Rxw$rO?tU)%?5bS_Y2C;Z3V}e7 zM1{d%L^urO@BRCS4^x=%-R(^q_pDZtc0=v9{IAZx%Km=i@%9vZI2GYPmOVp4qG*oT zk9UarAM=RtEO7DVzZye?54k`#hCfQKn}(}XfZlm~U)nzsHaEa?MX>-ChvB^eRfh>E z%|-r0M{_7)NNJH_rw{+$sXvDzOduxwe^pdE137;w>3ld>=Y+KqCFB{#XSm>xqcEwT z+4%3dIEfOjvYhk1b7-Hl{`#zEI@9sno&lr&-h9K(7XQ(AoV-*^ULoAPOwY^WMPKy5 z5Sk3`Cs7=k@ke?IYQ|`za_sU0M7(3kP(qV58>Ab9`h!k0%e9<1g~#~X&P(16Pfc|| zu`5&SNhMumGZ`&U;^dS+BR-DGUHml^*JW8dUED*HSue({-WS#{a5lSieKd&Wae0hZ 
zwcuIzT41MqH1O%S>Q<=(p!?c=eFaQ^tzZ@@)ce}w?&d7{jrZaXU|erAH?dOaSmgFVWnAFmJ!eM_F{eZG7fLMw2w(I08a%R#eXPuesi{vip5;qjHI{qwF;Bm z^IY$IIgB~wjKG7CMOQe#0M#>&aov`cp#x1EaAD7+t= zT@#vi{VcoHE06IT6=ztZgkNL^zGbYMwbk=`#L1Ff0T`Sq^8(C&Z`3k+|GL#~P=LVm zaxUh*45H`qXg zguuqQ5^m?(?{9K6s`!U-f0n0rb z7GDB3k~wv5h4~M+y#|w<#fk~-vTlsaG+NBzNw`>`KhJvFXxg~=ORL(=yyAmS;vh8Y zB-oew!(PNvml=zyfamyXPZ(-9vMUXLMR3i7+k&vHa%bjjBGVT^Nw17Z)=Q#ytFI6H zG#+lzWV&PT)*lTZ*t7(ydYt_DDxfQZ8^tKf7osWF`$p5|IiFM2oFh7crnS#=5KmwO zQV-3;{u`)GBhV@%J;#q%FV*JQzq5!frid3-=jAj)7I`SdT|zkZO>Xzwu$E@5njZ1b zRE(=XCGomG=)alX!(1OAGD*|Ri4Ytwd{eal9UB@v`WRUD2?pcrVX;Ht%Lt z{WC!WNqfPfYHs}3kk?=CRM-rpIumN(TJb}LU0~)ie0s-+8`2WM@cr4SoP;R6j4)5! z(j?V_lQM#^EQd`9*g$zl!|T!N$G6|v2T1@Al{_XPLNA^A(K5&D?$-DXH&38yQPsSw zL?d(Kx&F*y`i=PET9QGeaQkJ3+iuB5td4)V+yMN?3E)xC7l0vU@jvN|(zAX^fO1Ne zsHuMzf*1+7)W<5fBeKjKCXMqR%iZG>_{8|7vJd$S_P8}*#nE~sjD}n=km&}wAz!SE zcUe%pr?LgyGEvJhnMe3s+p*!D2YlS~>rW!xD?irB+I@`fCqG?SjBU6@qInW85Qd%Y z%X#lA`yjgUBwo(CA=|YqE+o#2K1;cY+H8uCa6lOgs*(JM-PWyWG?U*@$(&(nb^|<1 zyLEe&d-mq_@4%!Pdr}Fp<$jlnzmGg&WJ-jKj%cS=PWz1^N2-=+om(j#5*}Ma;Y6{( zkRe#Kw6YYuIa)TD8mjOAX>+@5&~hCDRlpg)eZd^a^dt`V2Tg`^_Qk7Rf)zqO|D#D@ z)}oEUypG@*0v-2~nl!KGA?juEE0!-S6`kU#@Rpp{hx0hWkLb$G3&@p0KAn~yFr{zc z!fVTFCh0~oIvE_1MB|y%JFlhKZu~rZOB)Km)%JGc4G>?R0}j;)6k#KLm-s3QVXOEE zWP-0oX_&O17L0AizXl(#iF6=B!uXOCl;!N)6VL~o7FJi%I*|fAo@tDmQs2z4N#di! 
ziqI+Me42pmS=*s*Af%}AuQMYe5}^~enrI}xAvY40YMa$I^g(R;(POr17GY^D<8)@a zaLDVlMYUx!r=IiWy@LFV((;WjMV6C^q&?Bj&^L>y0uhoD}F-_pLpVSQU7&9 zzC6lNGz-2k)>cy8cy6bi&O2TMfjJ}?xf;?y`b`SRo+R8R;9io8CxWR=N9KjB_lJb6 z$NBHBk7_)G)bbne$bG_?YH0!IPkO42sBND}9d6}i6@7$~;n!*KSUufNCy}BVGNsoR zSOKfuMWlT1U-8WT)n55~LF_0LJHdjnoY!@4YDReNGyVl@B!s=W#(6J(dcuv`Ql+d% zsgE~js*EAUWCGlbL- zCd-f6y9o*|<69IQ^hpvY*7ZTw6vew4;g8nXI#sAz?S`DcfC>g|6y};heGOm8S^`$d zJdTI;nr=?nf41|I+a9{GK9KP};mx6fYX^RHllLGdUx^5(B_2mz(KG(q=`f)+!IP1t z4*w1NvT)$myEW^T?;>Ir^EhfMAQM;DhsdJwX8{D-EXv-yfoZYx-!Bcq)drmA23XAz zv&}Yaq}WaoP4gkB<480Cyf;yYUpA@K!c>Jaon!D`P%6K^81S4YZ@tvhZhc@% z4S3d;zLx|O`!_ao5YnPlTyyZ1meZWkS$nO%_Hhm1=B7D#@FzqBVh5rSZU{^;Pd`gS z;ku0rS4EOfTw;j5z*AAjSZTu73WJELO8*f;_Zsx_Y^Cp=!2*D#KcHyf3 zogPOHPa)Gz5gB4c*RPVTPqA9>9$8EJlW2Z(SbZ*Q42wW5WL_gLv=ygb|ShT#vyrK1>MGK>`1onLmpD_>pA>40VOXGy z^M_J+Gxth3&Usw9cvc(K=R5W=Bc)OI;bXHeP}h@Rc=w)Yf6^f8r}kR)N+db}!Hu{9 z{9!j(nCOS2z^yl_AI8`Ul#|}~W`Cz@VO(~!&~jbXAj0VE3V`VVgY&1u1dAj9=nfpr(DQ+ck;`#+}O*)t>{m~cvR zSxbJ&dJX{H);27mG*`MwRb9lgEuriEHWuAx@8Z^nPoG7-xjenvYa+h~ zn<_?q+q9#RQ9`$q+dIJ7IMIp6|MO^22&<^!R2_XL^GnV-?2Mm$JxoTOfX`B=mRr`Rjr(ZVdogWaBzs z9;y6CyG8)yN58vX7i#-bHt^UJI87aCnvYjrD)3NQ&tVCk!-NChsGH_`>)G{CC9ZP3 z?)ozXgCYAQ8>jSO=wrGWA`>HBti~zIKy}Tr(>e*mNa4`~0;iLd;e@Od{J>r+NK7-y zaA|#4_!Xb!+c2eq_mofI3+-f;SNIjCczKcp?*!EWeav4dA(~*#+j#gcIwD z-^wJ$MlKMx(l3&%IY*HRd?#8wF`KCdf9IIc9LEBJn(O^>4Xa#iT_onhqDEI;KHJr9 z6;SmC_XgW(@dEUcSDZDW#Sb-TGe1*sG0O*Gg;12XZSsT%W+m5gV&uUzin&HaA`4!L zEa}xOZO4}N2Np-j{pMuigVWx;UfUzCayvqU$qaPHawTqHyI5qDBJUiN4`P^Gmky6h zfP>!$l(wN+t0Tivh3>A)EwGyEy=IB zdLNDKDIiWqBJ~|&m{b@|o90(Y(>6LL5B4~=8_jWdhn6az0>Mj2SowLHIeRER>hqK* zgAs#zwoB@!s>)1?%_rrf3hYr_IM5SZY3#VtL1Taz;5u{zJVzi9hqKE8G1L+OrO{-W zYI4BV&~siU5U^z3!rlyz2XoYbs2|z?{Cp+K%7HVm1ZQPcB+_V8ZQx|ZW&O#PoTrm* z`j5cX3-_Q!TSdrB4kPWx5(vThO7WP<)Eu-yv-Pdc^8EH{&u)h*yCiy+fsQwW0kx(9 zxSZl-FeB;-t%@sIf)(axxPG<>VHs5+5m!^lU3>WST1lGkQ|MO2TU%q+@dWjEbaoWb zuZ=*Ug-k?TepH_qE*H$V(4!mx7LzISx5+fJGI_7(HSQjVXWf%Ze)Mhhb)*9~;wdHx 
zGWf%XIAK>fDQ((${kfec({1>~1FNA90v!@g0NI@@?V6wvyx>*-yb%q-BX@TO0!%YT z*$RqBo6}}RkANtz;fEwWA}P5dW@#^dq5s#)X?pXreojuJG$4FgV?A<(uQTPeFDH8d zj;3Ej{2jxDmg{CN;}3r{)DinBqr|D^e5QEZ0=b+Q(XI9)(lh~p$+^OEGe7uGse`Yt z-jcsKx(~srd2y+nh2Og1llT>jut;O^0Wn=lgI%gcWwHxuozos!hR3Ozn{iJ3-ImVX z!}4Ur@2t42+5-C@F+$H8&gRjBNF7znOj4zo=!gl~a-zMTnr_RvkDc5zLi&N?`UoWU zLm~+%exj1idzCYmvK+o7=*k_pw`Wa3cyBaWF)R;h^Q0LwA5GLP1roOcm-G@_3#A{w z;220RuY8yJCp0gYK+uw&UIW0Jg=xqJlcH58BA;P5L?gl1VrlqwQNSn6WZn(3wBelB z_a0CWK#J^Ij-5m%gaw_G;_K{1I(GdW+Ow4#vdYhfi#A@EqaWi0@)<#@)L?}r&QBhB z)BxdjM-UR|9DwYl-I$S^lLz6qQ9Zm}sYbD-qHTEPZ{4q!G?t{ay^YN~%o$y;fdmyY{mdGP2%86U~qOU*^>;B{Q8@10| z&#hxwQES-4ZNIxrCh}t;g;=A36x#V606#lA)xa zFuA8HTq!V~Lirg}^`bA^bNL<-8JMOf@a&v%bQFJQ>r;KlXo~EdyfGUs68{(p8ZcXv zwGT6~m*VBh+zh8x7=i15V6a&8eBlY{XgHnj`{n0eiixBjB-yjITr2l*tV2Ca43nol z9)6N71$YjZFnUqUzHUTR65R=bU!OjHmkrlrc{>CvTrTpuDTKPAa2UGBJjZ7p=@l6% zgB^US(`96o$!O^lfaknENI$`J&fKTI-LdjwrwBXpM%-D&TW(s~OO}eh2)i@3>;d7>2Es9?1l_>v>HNGt>TJfKZ%R^I%c1s)5^%;l^u`hjeIZp^?5!?t;$R62s z1y-1&?gHS6W%x)!BWch}BuJP0lf;Uj5>;(SJ6t7Dcr_ilTJe_8 z!mbM!lpsuGhmwOc(o5pKlY*Pj=|j*?keaHC&F|0AzSulzveoK@mB-S^lXxHp2?Mh^ zS1%HJ+rge6eM~gAhpU{6}-#MBx$+UoOmK$vQtuFO< z*mXMGbHri4MnVAC;6~@kvF97*e)=qpeyYfVNaMqPY zDR7n@##B0p0Yky{pGG4N#n*%ti3bp6=_(Mn1og1t_ueDMN_1v2vI5FT?$*Xp$Ls+x zR1MT2uch0{-V(e|Kp!o-Jn#tRs@Vs*-&6!Qopa9X?xu2JoWA#bP#}~jNMrk3N7+Fz zGPnML#p6!Yp7XNRg)S|Wx|ZrC7NjDVza683$9 zyOLFtRaDI+>{}~LvMPoiYWvAtpH7P}7^!#%It@0Ye%QqCD(#sE&$T1WrN#Q-KDOv+` zyt^mu8fk2k+mm6@YL`qoQ5aH46im0fWWme^Km3ftuhgY-cNWzFYB*`?Yx#`D^!d6r zPmnkCNql8&P4e0+gtjWS5G($OvliMS)yY;_ zGnvQ>;ZyE4ZB-O}GL5s!P5{jqTi9isr!Kk=xze1qKo^|S@_xS1MnM&iM?`Y@$)|0a z17I3_=~LdaX~crguax!H`OmQZU|?`{Pe7~ zhB4%-=NalR2oDTz8s@+!(bal?ludfXzDqc^F0~ae7Zw@(VGr`LQUj0{ zR!Ly-p|q!^QFb?BS;Sk)#e}TNJZZ#44ju^YdjE+{12?#+?s*Rc&Edn#ihSX>TG#9r ztAa5=wA6()lhFM|(q4l^%6&K6ND7Ntu!k1*u+I1*1vj-+jW@|MoboV~ zD}95V?kTMY&3Z`Rs;5x|_PnSRTqXli(G?x)tXL44DX(rMc#%hHw&!unUmfYSHnn&{ z87luQSG=(3 zR*TbiSN%#5xu>&nihvq)G9hQx;Lasa0)Hf&{gMfh;T*xE?kgzC?DaIJ7n+Lt6|6j3 
ze*iApcP)ZnFcV@!w1&6F7|g2X8?C-=)4rpVfM44jH#^+nF09nO&QF4ymWm5T8ixP{ObX`LCMnaL?gGA2(IbA*kz9#vZL0J)#;h@wCuqz zqdrPFL_gW-s_dl{+d3#aWUF8nkh4deldv+GZg#RaxDSV$-nB1046!v3;Tu4%my3SN zFUv%`N9s7)GQ9(p5=xl$W&o~A$rLz91?{@8DW-7JA; zK>Rf$8kMW!L;T4_fwrw6f|TRUYpsy&{Ibm^e2SV4uyP8_i(=1K_8 zQ=4LP%g5wttU1Lr0x3T<-x&QFtYuLlaTnNl9>saPQ_IKIBn@&;+VHdO89a+?5r13~ zW?KSG}I&_uue3{#1?i;#=xAn5FWD)fQ*QHAjV=Xx{ zQ5PRntD8B7?N{r0zIM3dF_$l<6AA3sEb5tj9jk8*Q`ZHWNUvU)P1D%Zb#rVFk0@x? zUGxupbSu3)X8o7=q*0_?Hl*%(nQ{Hi%3PPv6q0i+q#aQd7%$oReM)+h{GX0}-cuQg zG@OZBFs1QNJYDgo)NSXM%aeLJz}mvpHISDU#`n=$+lI`LAbSs#l{ZXdtPCq?J6}$~tHo?(aylCl!0WF!bWCtg98wk=5T4Db2E{_W{Q)gW-zwMpv z|JZSLh>fh*>&@a!Uj)gMd|L~j1Q8X z4_MT_1vS@YyQC`xNiw8Mlo&En>u%lNwK6!1lc7Ja*`Jzf%50cPJ|J=4uc_>K^L1J? zEYa#kq!9m#^RN9UN3jgSSqm>`9e*unxO*Q7;0Na$M2sTxAE>XiH#-ZH$O_`fpX`Yj zAG|w?rMn#d5Jc8X7qDE=e=HP^>(r`LtTGtb&AZdpyw9N`j=%58s}S($2il*fXmkj| zW$OtdO-XprMH-k^0v^ba%$1`;QU3#942sIcOXL@GG&D!Jdwq$(?7m6>vo6k-)S`Jw z=9dO$&S90!hYC<%wiSu7OnhXv@unyzXb5;oI=8sjQS29TSIykS)q46T2 zID{Y>z#ve`$c1~O` z>1_0v$Ti4rB$8@N##2%e2-LS^{DV1pnRc}425m5Qa#m_%YaQ-I7#Cm`E8*#6#ZYs3 za|^K7w5rj7uJ&>gANulByELABY*dxuYr=^cJfXOjnGaB11j)nTBII=buD;8I$Z34K zWEniA6eK1$tmx5azA3MVU!F_wbS<-(j86^uzBt?(nQ zMO;(=hA8o5P*W&Msq*j7osbJr9-yfe-ac^2o=BbuIy(v7D9PvN7<6l^a6wRbE-dk7{6{`P0C)Xk& zK^8mF3mgMz^4x9E%|&Ceg83ojL+8pp=qx7wEf)E^_6Ls=Vka+%6CRLQ+V57QcZie=W+CXN zXzB?aZRC3yHRU$#(&ORjcOXwQIPCNf^zmB;&|<#0-_r;XkeR!!bNC@D({_G=kSG(v z(w<0ewto3LTKliT!4Tf~)2PUJ%Qk=tzY2+g5Ce}db#kM^kLaHMQ*J^Z6dcYegHVE@ z$cTsd?fFAC!%B03_<~n~7)00rjhnX*5K%#ZWPq(|5-LfeCuHn3sTcG!;|((^O_Hu} z@sx3@nq(6oKxqT?5*p0%MYZYnjwp`vK%J+VHl0NGsn0fmh`|@UJzu$}mi>W9mB~fD z&RqwP$g~3d1A(&&pn);21_%xM+oeNC(`foXsOK>vBp};tvhkzv&AY-TKqhief#;IR z&hRYx;{*anHGCGJrk4QTP=POZ?P^HvdE^a{O6C0y@O(@6R13i1rc~$wBArJ7;q4K2 zx?k50kfpj|9=8E*8rCfj+5nc0_+GQa0#K6sK$iVtiREYf%V`eoTcAQR*(z5gRYXwp zVvCH^`t+Xv z0u&%x=KyEi3bed1pGdlLlDL$Z3$|w54ez8v``Xlij@?GiJe>m2(c890V7p8~kJd=O z-M2ppAwtRTGu{iM?O`r}w!UFa$W2hEm*bkV zU&HW4xSH&Oi}P)6NzEsPZuMPi=8?{_M^b_sTe*#x)a-|!xBa2%2#>P_QYIC4&0l~( 
zZ!NlZzZLx@YZ;E&@xndbYxj7nEYtl^x)~8}8X_EovzU;0x5vfL293qHuGfyh|= zEDWXH6g4335JViRt5O!}dDL|#KySu*um?O@j(0%z#7ot@qyuR%5>4iJ;<5ug3uJYC zgbYu9yx}@@{8f-&Ngu3764!AKS~HxeJMg^Q?kck{$xN(rxM#4-OCg%OX!@z;Mljl< zrd!u)Kxn3c_fs2aMK4T!N4(1N~EKK2A!Op&kXz}Fz`2|&Q<@xu^09ukwt%1?Pm zZ}-HYISir7x2kUs$e*#R&r(*79QH9=4a;LLx_=M?5@kQ}Edq-5?L@;z!TX}A--HNXV=;FD1y(o1_%K+~d!^}t^kh&P1PWt)k@REK`Wd!rr zvMa=@a~fNgK~J2__qG`s3k2rfX_rQ@S?5#x3|V^iz1|}H3aB_JJ!9O@^+wypXnJ#v zo0gp`S7oHf(N`o_ITRtWfV&WJ-e+Y6@|YJbhrrjbHDoYMsO#tQpxiWu6bg-Yzf3@j z!#z?}&JxQ2vS0mvQ7sMA?+Vo}QB0+rB>>)zy6_Un;b3A3U0YXgWQT3@6?}zQ^Vd16 z-`(ta&A?1Xvb3|~nQ|7`p!`?cWowKS96noY&PmVq#}=tpqI?v!a*SEwF%lvVM**j4 zS%9xi165+l`FQ^%H`ZB)O+ZT9u(+BKLgLbR20Cgwi@A%e#A99 zR6ho2Jgdg=GjKADDZT*wcDOPX6=@OKW+Q;?OLDCn?ryJ^0PkjbYQC~#jMP?k*GX(e z_${a8>ZS>hpCw3$$~;18h6j=8o3hZ_ueReTVgO?`kz)7V_P@L7@_=mq6oh)w5#PY* zJT0aN+8@}^ln&gipgkb(wIc_zcz$#28kek{4@{Z(+fuC>r>Gx?L#SozkH9CsJAkpY z`trs}O3!H{Ip#O&0hqG7F!`S1LVBQj5umm&xB$s!+!k(y8)2@SjrKLHXWj2M`#%!)&{|^Xy$gZd~%+w7TZeA<}A{2&YQ3CZoM4TN8ueT-0`0wu@+Hm$9L_ zQ3X|z`*=y|&f+EaPbnwr=?KWAH<-`3@j=wHC2h1`VSokyuEAZH6gRGBLTcv@WfA`u z32qJAR@^r0ESB_G5)Zf9e)Gi2vmEE~YLhZ^%jXBwv?O;&m(EJG_+)IE$=!WmBUlDT zw=8o*x!jAFNMH0|R6Yacz;QjTOT~ykB17X38L5GX(sF<(9@f~26bKKzkFevE<*l2YT>mEcHw2xIL>Q1H88IYU+Gqzqi4DNPfg>Ta zb`;a_h6;uRtUyfGoQ?_BvkitFHaxQB!6<^R-y^20BX4i6P%+*flcKO(l67&_woK3% z?EJu!<6GC;fWhc?EKZup2LxLahqTGb)(tgA-Wp6>;4LiNOVtN}k^He2k zQ>dHSH-f@c6I6U+T{+~G9$e~~$bh_!Z%&BBNb<2MFJz``#=J~^(kM}D8_PDS>K2cf ztS+n>>U$Jy(|4;{{A2TDxWl&GHru6(ipFy3d-reUq&>B7`3!oc1yAV=W=A{VU&HI3 zxy5nZO@6e-41P9%YHj?8m6LT4nO`#ro!`0jd`*)?6Qs^f&aY{W(Hs|@eKFkkthMqL zsCwL6*dNNvJ}>9*;eKXNS+>~pwQ7EPyi9mtL$gGf0?tyx60K#r^qv=RO{hPt7o0 zZ%ks&@7<*5X=g$mTMjQ1x*2@CLd;0*zO$aDSK>HGz|O!wYjm`05fB6Acw4AOb_XIF zJ+7u%)9|B}Gw@6`32BW$ltzHfDz_&xsZ_v2@(rqsK_RFEXoV$ywY=S5Y*`aOD2;Yz zX*q8_M|fFGkrHvdJ2yjuE*LYsJ88Ce^7iR{&i6iM60Tyob1g?B6?yXGgvyR3u=F>T z-c8eb9ce&37Xa>fnoqh*=#tQ_gCcCdLQ

#n>*d`5EAK*5=_9M1?KorBh z5^I(nXJoV7VMn$?G{Y%>xYl+4z{S+4Zn}|G!MjJuskBdbS%ij0hgUv}`kXf%rQqB7k0ZeP!LuhXFM~puk|* z4}GABH_`60xMfolv^s-eph(`eQh{;+LJ$#8Be|-mCZ}o6IBj7a85ZbhA7rfS_{6j5 zjU4`LWmSq-Vfpe}&^`OCCz$O(;6-5Ng$p-ZbMTclqR#w)7H*U|TEm1np=wQmW8{#}-^Eg0fZ8^m*rqEL>q@l6 zRusgO`3Lu&Z3bK4AZHtaNTFSV+yW|>3_CGHXFyXhdjA3V!$(tHL!FQ=n+Qrm6E25C zeJP6BZ!6cH&pzLP6W6 zzktGBFGaH^R%w_Ym=A~V5%I$rKKx7il_bDb7_u>_R^BHn`Kr24Be!I(G)?(vW%+`W zUZM~?i@zL~wpDu|i`o*;gIu3vpo$GehiY}^&+L0LtRXfs*97df+mUg;P1wog5~AMP z`L)nRix{{siX;#|XgJV(pw!?;jwQOVuA!*oE6x+MOz4Mbg|V7gk!uuy=)aB|^;A5F z@gXSJC(BSjiZ1=L02TFov<66#=`3Ws@oKm7jK%^_jk1J^m zUndb)GQ&oWMasqaOIYib+&k1vX&kXl8dT5uiW|b=7t|=(dyBo^T}mIkxI0}uyj}GT zI=1?!^=E}$T{Wu12HWt7Op~q@TMVpeN+iufnk-k~ zS$=B>f?0iU`-7Jsp@KJjKiP;?)#=JiE(%EyHHSx}DL%}}xrQGh<)J$+ z%w6@Z^$%E4Ox73@dOMb5tWH_Uor}XSytASQUBb-<tk|o5%WI2UXJKS zj^@?Z8#xW?71odbpt@{E)z|*>K-bl^V9$gUBRx2zL0vB$(?8{v<}VXvT^6^;Ok{K; zL8@4YHYPr<34r+AVeADboWy;H8+Giji6;S@00gjtvUcG-m*L+0K_<}u znQ*ox*mZxgM)~J&cAkuz8h00Z*gvfkPtPn3d)EhRD?>dflt>~`rRjUDS8qaVS-(z` zW-SW;;K)p1s`~}XM6sANcD^TQuvk6n@3t7AB5q^@5)LnfT2BIb|3_}hWy!&x5-+9i z^p;ofF8C$GAGJ>yzP1y1|0j#$b4Tf|7kNb7#g!Sty=1t~j_GL6)k!VEzA$XSq(ECD z!qUj90)JpBm5q84ZkKjQiDQP-KnA9{gt(z}@hB(|43e~Nq9=bkCWSyWFbt;ycC){3 z(0>a!7;MljuX_>x2UicAQ`vKbEwjj&_V&D8@V=aa?4nOEN1VaBSi@G*YLNkgvJ3e_ zA_^sFJ-p5H2hThkTF}a<=>mrWu zOTlpgyS8=yVg=(7S1p&LkC`tAXZRbF>Wh96%9bY3H;qD-p4npubBM;mu7&+kK%<`VPz7rKy<)(I8f6bTDDvL50AjmPVPtaf?YylpQL?m?Or}+ zg1(sUBVIpWGG7g*j4ZC`77u`a>zGNW>mq+)j6xR&i;KTQVO{stW0(!Y+IJSpv}!m} zDMXGU$6;~CCjI$!fDkL#pvNTg%86pqxk4@VxlrqHG!4XpAR`?;5CexZjvfcXO_NEv zvz~0@K_J+*u<1ky<))Za%(U5q5tcd5d_0ME(iY6yDEbHlW%on}3DWnn63dnkQuZK8 z`c(ok{Eum4GKS~-O9=yL2hVBh4!YeH$9hTU33tB_Z@if3i8pDaZVh`uu9IlM1OaCY zK@jXwPW>d?-ZHy}IcY9}e!ihC^}p1bC}{xRY6(|5PcbqlS60@VxVqx~gq4a&NtBL? 
z3FeH+ue43Wcsh+(^1(A$GWJ?kd7iJl&AlX%<;tYm-v6R1y&ST0{d!M;NgF(oh^?>K} zW~U*SGFy)5mHl~+a01M)n(&55ST)FCH*?`oe=#4+R;o32A-v3FpwXIhjDUZ5uW zi_HuNvg;>;kA=(J)gFlYw2^5mk_8eREJpI8G@7sbOVfF8-<#S8l>BQLyGgH9lruP& zAK2R_t57#Cl&>@n($L>&Zzg2siMs56A$%I`nVGfByP+thLH(;*(Bn_pw@(5%OOYk* zUrB(Hk5gvCsMh>y2{#Z8@W(q||3qoaf>c@zUJiLIC4yK-2DLYbe6F!>tx&CytSA`F z^sLuI^c73W=&=_d6G-b6@%EJUYSorI)jAg$p=&3ET_Mzc>sHwPOuMF+P;X-HZY@V# zIM!xkEw?NuKw`pwWFDIH){}vLK`qKpmg-CqU#S4hf>#xQfXp2$=}tPf%A-9VlQi^jjbqV=cb_{!hgyuaVVO;vy2N7sAWZZZ1rR7_AJIEia z<)5#2b(xamNaUUoC(3&&DE#VKdA?8+HK`WOuhY&I68vXy{VojQ$T|ZaKW2LHV;Hfg zG}?6jODN*wqPB>>j?5ZQHXM4vd3=GDzW2+Qhk`VFRDuK~p`|~Uk4|bzpjiu|#-mRn z;`I`9V`|C|wH$QFjCtmYS0=T)PMUOyA+Tpu4@FBeSuajOi3L*Ba_{hwK^ znw)&u9_0v1aczz`b3K+T}X zGl2hg*WdgQPEiZeqSe_vSYW?1=|emaU4_mMZ=_M^po_|&Bn^KAG5@Yt;*|hFr}A%w z{+~$^7|6dlNy2->McY_$wsC}R2sh6*Thm!A{m{=yaD_9-s+ zz_?gFP3cvxM&kmGX6@*(_=f1jAAg`h!18~H<(rd)vo7E8Mum+3O8Kkpzu)m$9C)8V zX7QEWKQ#9X9T56ox@y1s!wvmC9|4$p6#~2=@V>bq>E1>CSJ@Z=@QU%tN&T4mKjb1l zVFOm_eO|KuQyDWz+7w4OWuPwy(f2dut9OAAFq{GZMWd)&Xmp))A^^&bTOKJ-w)DmFJB z&i~8}*ymCdnDWMqMD^cc+kXt_H3eXm%9@@U^uL`w2>_R{|AzQ_iz9J literal 0 HcmV?d00001 diff --git a/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx b/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx new file mode 100644 index 0000000..b19e90b --- /dev/null +++ b/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx @@ -0,0 +1,64 @@ +--- +title: 'How to Split Large Audio Files for Salad Transcription API' +--- + +## Introduction + +When using Salad Transcription API, audio files have a maximum length limit of 2.5 hours each. If you have audio files longer than this to transcribe, you will need to split these into shorter segments first. + +--- + +## Prerequisites + +Before you begin, make sure you have: + +1. **Python Installed**: Ensure you have Python 3.8 or higher. +2. 
**Libraries Installed**: Use the following command to install the required libraries: + ```bash + pip install pydub + ``` +3. **FFmpeg Installed**: FFmpeg is needed by pydub for processing audio: + - **Linux**: `sudo apt install ffmpeg` + - **MacOS**: `brew install ffmpeg` + - **Windows**: [Download FFmpeg](https://ffmpeg.org/download.html) and add it to your system PATH. + +--- + +## Splitting the audio files + +### 1. Create the script: + +Create a Python script named `split_audio.py` to split the audio file: + +```Python +from pydub import AudioSegment +import os + +def split_audio(file_path, output_dir, segment_length=int(2.5*60*60*1000)): ## Adjust this value if you want even shorter segments. + audio = AudioSegment.from_file(file_path) + total_length = len(audio) + os.makedirs(output_dir, exist_ok=True) + + for i in range(0, total_length, segment_length): + segment = audio[i:i+segment_length] + segment.export(os.path.join(output_dir, f"{input_file}_segment_{i//segment_length + 1}.mp3"), format="mp3") + +if __name__ == "__main__": + input_file = "path/to/file.mp3" ## Set this to the location of the file you want to split. MP3 and MP4 files are compatible, but will always convert to MP3. + output_directory = "output/directory" ## Set this to the output directory you want to use. + split_audio(input_file, output_directory) +``` +This script will split your large audio file into smaller segments of 2.5 hours maximum each and save them in the specified output directory. You can input either audio or video files, and they will convert to MP3 when splitting. Make sure to set the input, and output, directories for your files. + +### 2. Run the script: + + ```bash + python split_audio.py + ``` + +After running the script, your output directory should now contain your original audio clip split into compatible segments to transcribe with Salad Transcription API. 
It should look something like this: + + + +You can now use these audio files to transcribe with using [Salad Transcription API.](/guides/transcription/salad-transcription-api/transcription-quick-start) + diff --git a/mint.json b/mint.json index 9814d7d..64e81ac 100644 --- a/mint.json +++ b/mint.json @@ -454,7 +454,10 @@ }, { "group": "Cookbooks", - "pages": ["guides/transcription/salad-transcription-api/transcribe-youtube"] + "pages": [ + "guides/transcription/salad-transcription-api/transcribe-youtube", + "guides/transcription/salad-transcription-api/splitting-large-audio-files" + ] } ] }, From cce83f8cc0015325e67b532a33ce856581caa3ac Mon Sep 17 00:00:00 2001 From: MerlynTheWizard Date: Thu, 27 Feb 2025 16:24:25 +0000 Subject: [PATCH 2/3] fixes prettier fail --- .../splitting-large-audio-files.mdx | 23 +++++++++++-------- 1 file changed, 14 insertions(+), 9 deletions(-) diff --git a/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx b/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx index b19e90b..7badaad 100644 --- a/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx +++ b/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx @@ -4,7 +4,8 @@ title: 'How to Split Large Audio Files for Salad Transcription API' ## Introduction -When using Salad Transcription API, audio files have a maximum length limit of 2.5 hours each. If you have audio files longer than this to transcribe, you will need to split these into shorter segments first. +When using Salad Transcription API, audio files have a maximum length limit of 2.5 hours each. If you have audio files +longer than this to transcribe, you will need to split these into shorter segments first. 
--- @@ -38,7 +39,7 @@ def split_audio(file_path, output_dir, segment_length=int(2.5*60*60*1000)): ## A audio = AudioSegment.from_file(file_path) total_length = len(audio) os.makedirs(output_dir, exist_ok=True) - + for i in range(0, total_length, segment_length): segment = audio[i:i+segment_length] segment.export(os.path.join(output_dir, f"{input_file}_segment_{i//segment_length + 1}.mp3"), format="mp3") @@ -48,17 +49,21 @@ if __name__ == "__main__": output_directory = "output/directory" ## Set this to the output directory you want to use. split_audio(input_file, output_directory) ``` -This script will split your large audio file into smaller segments of 2.5 hours maximum each and save them in the specified output directory. You can input either audio or video files, and they will convert to MP3 when splitting. Make sure to set the input, and output, directories for your files. + +This script will split your large audio file into smaller segments of 2.5 hours maximum each and save them in the +specified output directory. You can input either audio or video files, and they will be converted to MP3 when splitting. +Make sure to set the input file path and the output directory in the script before running it. ### 2. Run the script: - ```bash - python split_audio.py - ``` +```bash +python split_audio.py +``` -After running the script, your output directory should now contain your original audio clip split into compatible segments to transcribe with Salad Transcription API. It should look something like this: +After running the script, your output directory should now contain your original audio clip split into compatible +segments to transcribe with Salad Transcription API. 
It should look something like this: -You can now use these audio files to transcribe with using [Salad Transcription API.](/guides/transcription/salad-transcription-api/transcription-quick-start) - +You can now transcribe these audio files using the +[Salad Transcription API](/guides/transcription/salad-transcription-api/transcription-quick-start). From cc8e6d4cff847489c2af65c1930a9a6dc01d6bd5 Mon Sep 17 00:00:00 2001 From: MerlynTheWizard Date: Fri, 28 Feb 2025 12:17:03 +0000 Subject: [PATCH 3/3] updates python code with pr comments --- .../salad-transcription-api/splitting-large-audio-files.mdx | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx b/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx index 7badaad..7ae938d 100644 --- a/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx +++ b/guides/transcription/salad-transcription-api/splitting-large-audio-files.mdx @@ -42,7 +42,8 @@ def split_audio(file_path, output_dir, segment_length=int(2.5*60*60*1000)): ## A for i in range(0, total_length, segment_length): segment = audio[i:i+segment_length] - segment.export(os.path.join(output_dir, f"{input_file}_segment_{i//segment_length + 1}.mp3"), format="mp3") + file_constant = os.path.splitext(os.path.basename(file_path))[0] + segment.export(os.path.join(output_dir, f"{file_constant}_segment_{i//segment_length + 1}.mp3"), format="mp3") if __name__ == "__main__": input_file = "path/to/file.mp3" ## Set this to the location of the file you want to split. MP3 and MP4 files are compatible, but will always convert to MP3.