o
    ã¥µim  ã                   @   s  U d dl Z d dlZd dlZd dlZd dlZd dlZd dlmZ d dlm	Z	 d dl
mZmZ d dlmZmZ dd„ Zedkr€eƒ ZejZedB ed	< edu rqejZejZedu r[g Znd
d„ eD ƒZedu rig Zndd„ eD ƒZng Zg Z	 ejdd„ eeeƒD ƒeejejej ej!ej"ej#ej$ej%ej&dœZ'ed!i e'¤ŽZ(ej)ej*ej+e(ej,dej$dej-› ddœdZ.e.j/dkrpej$r/e 0¡ Z1ej2Z3e1j4e3ej5ej6ddZ7e 4ej8› dd¡Z9e9 :ej5¡ e9 ;e1 <e3¡¡ e9 =ej6¡ dZ>z/e.j?ddD ]Z@e@r	e7 Ae@¡ e9 Be@¡ qùe>se7 C¡  dZ>qùW e7 D¡  e1 E¡  e9 D¡  dS e7 D¡  e1 E¡  e9 D¡  w e.jFZGej8› dej› ZHe4eHdƒZIeI AeG¡ W d  ƒ n	1 sQw   Y  ejJeHejdZKej	rfe	eKƒ eLdeH› dƒ dS eLd e.j/› ƒ eLe. M¡ ƒ dS dS )"é    N)ÚAudioSegment)Úplay)Úaudio_to_bytesÚread_ref_text)ÚServeReferenceAudioÚServeTTSRequestc                  C   s¢  t jdt jd} | jddtddd | jdd	td
dd | jddtd dd | jddtdd dd | jddtdd dd | jddtddd | jdt jd
dd | jdtg d ¢d!d" | jd#td$d$d%gd&d' | jd(td)d*d | jd+td,d-d | jd.td/d0d | jd1td2d3d | jd4td/d5d | jd6td7d8d | jd9td:d;d | jd<td=d>d | jd?td@dAd@gdBd' | jdCtd dDd | jdEtdFdGd |  	¡ S )HNzCSend a WAV file and text to a server and receive synthesized audio.)ÚdescriptionÚformatter_classz--urlz-uzhttp://127.0.0.1:8080/v1/ttszURL of the server)ÚtypeÚdefaultÚhelpz--textz-tTzText to be synthesized)r
   Úrequiredr   z--reference_idz-idzgID of the reference model to be used for the speech
(Local: name of folder containing audios and files)z--reference_audioz-raú+zPath to the audio file)r
   Únargsr   r   z--reference_textz-rtz"Reference text for voice synthesisz--outputz-oÚgenerated_audiozOutput audio file namez--playz*Whether to play audio after receiving data)Úactionr   r   z--format)ÚwavÚmp3Úflacr   )r
   Úchoicesr   z	--latencyÚnormalÚbalancedzUsed in api.fish.audio/v1/tts)r
   r   r   r   z--max_new_tokensé   z2Maximum new tokens to generate. 
0 means no limit.z--chunk_lengthi,  zChunk length for synthesisz--top_pgš™™™™™é?zTop-p sampling for synthesisz--repetition_penaltygš™™™™™ñ?z Repetition penalty for synthesisz--temperaturezTemperature for samplingz--streamingFzEnable streaming responsez
--channelsé   zNumber of audio channelsz--rateiD¬  zSample rate for audioz--use_memory_cacheÚoffÚonz*Cache encoded references codes in memory.
z--seedza`None` means randomized inference, otherwise deterministic.
It can't be used for fixing a timbre.z	--api_keyÚYOUR_API_KEYzAPI key for authentication)
ÚargparseÚArgumentParserÚRawTextHelpFormatterÚadd_argumentÚstrÚBooleanOptionalActionÚintÚfloatÚboolÚ
parse_args)Úparser© r(   úD/home/ubuntu/.local/lib/python3.10/site-packages/tools/api_client.pyr&      sØ   þû
ÿûúúûüÿûüÿÿüÿÿÿûüür&   Ú__main__Úidstrc                 C   ó   g | ]}t |ƒ‘qS r(   )r   )Ú.0Ú	ref_audior(   r(   r)   Ú
<listcomp>   ó    r/   c                 C   r,   r(   )r   )r-   Úref_textr(   r(   r)   r/   “   r0   c                 C   s(   g | ]\}}t |d ur|nd|d‘qS )Nó    )ÚaudioÚtext)r   )r-   r1   r.   r(   r(   r)   r/   ›   s    ýÿÿ)r4   Ú
referencesÚreference_idÚformatÚmax_new_tokensÚchunk_lengthÚtop_pÚrepetition_penaltyÚtemperatureÚ	streamingÚuse_memory_cacheÚseed)ÚoptionzBearer zapplication/msgpack)Úauthorizationzcontent-type)ÚdataÚstreamÚheaderséÈ   T)r7   ÚchannelsÚrateÚoutputz.wavÚwbFr   )Ú
chunk_sizeÚ.)r7   zAudio has been saved to 'z'.z Request failed with status code r(   )Nr   Úbase64ÚwaveÚ	ormsgpackÚpyaudioÚrequestsÚpydubr   Úpydub.playbackr   Úfish_speech.utils.filer   r   Úfish_speech.utils.schemar   r   r&   Ú__name__Úargsr6   r+   r!   Ú__annotations__Úreference_audioÚ
ref_audiosÚreference_textÚ	ref_textsÚbyte_audiosr4   Úzipr7   r8   r9   r:   r;   r<   r=   r>   r?   rB   Úpydantic_dataÚpostÚurlÚpackbÚOPT_SERIALIZE_PYDANTICÚapi_keyÚresponseÚstatus_codeÚPyAudioÚpÚpaInt16Úaudio_formatÚopenrF   rG   rC   rH   ÚwfÚsetnchannelsÚsetsampwidthÚget_sample_sizeÚsetframerateÚstream_stopped_flagÚiter_contentÚchunkÚwriteÚwriteframesrawÚstop_streamÚcloseÚ	terminateÚcontentÚaudio_contentÚ
audio_pathÚ
audio_fileÚ	from_filer3   ÚprintÚjsonr(   r(   r(   r)   Ú<module>   s´   
 
tüï
þü
ÿ
€ù	þ
ÿ¢