U
    (‰d1<  ã                   @   s*  d dl Z d dlZd dlZd dlZd dlZd dlmZ d dlmZm	Z	m
Z
mZmZmZ d dlZd dlZddlmZ ddlmZ z4d dlZej ejj¡ eejjjdƒs®ed	ƒZW n ek
rÌ   ed
ƒZY nX ddœdd„Zedœdd„Z d a!da"d,e#ej$e%e#ee	e#ef  eej$ ee% ee# ee	e#ef  ddœ
dd„Z&de%e%e#de	e#eee'ee'df e
e' f  f e
d dœdd„Z(ej$e
d e'e%ej$dœdd„Z)d-e#ee%ef eee%ef  e#e#eej$ej$e	e#ef f d!œd"d#„Z*ded$œd%d&„Z+de
e' d$œd'd(„Z,d.e#e#ee
e' ee% f d)œd*d+„Z-dS )/é    N)ÚFraction)ÚAnyÚDictÚListÚOptionalÚTupleÚUnioné   )Ú_log_api_usage_onceé   )Ú
_video_optÚ	pict_typea+  Your version of PyAV is too old for the necessary video operations in torchvision.
If you are on Python 3.5, you will have to build from source (the conda-forge
packages are not up-to-date).  See
https://github.com/mikeboers/PyAV#installation for instructions on how to
install PyAV on your system.
z¼PyAV is not installed, and is necessary for the video operations in torchvision.
See https://github.com/mikeboers/PyAV#installation for instructions on how to
install PyAV on your system.
)Úreturnc                   C   s   t ttƒrt‚d S ©N©Ú
isinstanceÚavÚ	Exception© r   r   ú8/tmp/pip-unpacked-wheel-vx7f76es/torchvision/io/video.pyÚ_check_av_available(   s    
r   c                   C   s   t ttƒ S r   r   r   r   r   r   Ú_av_available-   s    r   é
   Úlibx264)
ÚfilenameÚvideo_arrayÚfpsÚvideo_codecÚoptionsÚaudio_arrayÚ	audio_fpsÚaudio_codecÚaudio_optionsr   c	                 C   sÚ  t j ¡ st j ¡ sttƒ tƒ  t j|t jd 	¡ }t
|tƒrJt |¡}tj| ddv}	|	j||d}
|jd |
_|jd |
_|dkrŽdnd	|
_|pši |
_|d
k	rtdddddddddddœ
}|	j||d}|pÖi |_|jd }|dkrðdnd}|	jjd jj}t || ¡}t  |¡ 	¡  |¡}tjj|||d}||_| |¡D ]}|	  |¡ qH| ¡ D ]}|	  |¡ qb|D ]8}tj!j|d	d}d|_"|
 |¡D ]}|	  |¡ qœqx|
 ¡ D ]}|	  |¡ qºW 5 Q R X d
S )a|  
    Writes a 4d tensor in [T, H, W, C] format in a video file

    Args:
        filename (str): path where the video will be saved
        video_array (Tensor[T, H, W, C]): tensor containing the individual frames,
            as a uint8 tensor in [T, H, W, C] format
        fps (Number): video frames per second
        video_codec (str): the name of the video codec, i.e. "libx264", "h264", etc.
        options (Dict): dictionary containing options to be passed into the PyAV video stream
        audio_array (Tensor[C, N]): tensor containing the audio, where C is the number of channels
            and N is the number of samples
        audio_fps (Number): audio sample rate, typically 44100 or 48000
        audio_codec (str): the name of the audio codec, i.e. "mp3", "aac", etc.
        audio_options (Dict): dictionary containing options to be passed into the PyAV audio stream
    ©ÚdtypeÚw)Úmode)Úrater	   r   Z
libx264rgbZyuv420pZrgb24Nz<f8z<f4z<i2z<i4Úu1)
ZdblZdblpZfltZfltpZs16Zs16pZs32Zs32pÚu8Zu8pr   ZstereoZmono)ÚformatZlayout)r*   ÚNONE)#ÚtorchÚjitÚis_scriptingÚ
is_tracingr
   Úwrite_videor   Ú	as_tensorÚuint8Únumpyr   ÚfloatÚnpÚroundr   ÚopenZ
add_streamÚshapeÚwidthÚheightZpix_fmtr   ÚstreamsÚaudior*   Únamer$   ZastypeZ
AudioFrameZfrom_ndarrayZsample_rateÚencodeZmuxÚ
VideoFramer   )r   r   r   r   r   r   r    r!   r"   Ú	containerÚstreamZaudio_format_dtypesZa_streamZnum_channelsZaudio_layoutZaudio_sample_fmtZformat_dtypeÚframeÚpacketÚimgr   r   r   r0   6   sX    



ö

r0   zav.container.Containerzav.stream.Stream.zav.frame.Frame)r@   Ústart_offsetÚ
end_offsetÚpts_unitrA   Ústream_namer   c                    s.  t d7 a t t td kr t ¡  |dkrftt ˆd|j  ¡ƒ‰ˆ tdƒkrptt 	ˆ d|j  ¡ƒ‰ n
t
 d¡ i ‰d}d}|jdkræ|jj}|ræd|kræ| d¡}	||	d … }
t d	|
¡}|d krÐt d
|
¡}|d k	ræ| d¡dk}ˆ}t|d dƒ}|rt|| dƒ}z| j|dd|d W n tjk
r>   g  Y S X d}zXt| jf |ŽƒD ]B\}}|ˆ|j< |jˆ krV|r||k r|d7 }qV qšqVW n tjk
r´   Y nX ‡ ‡‡fdd„tˆƒD ƒ}tˆƒdkr*ˆdkr*ˆˆkr*‡fdd„ˆD ƒ}t|ƒdkr*t|ƒ}| dˆ| ¡ |S )Nr   ÚsecÚinfzBThe pts_unit 'pts' gives wrong results. Please use pts_unit 'sec'.Té   Úvideos   DivXs   DivX(\d+)Build(\d+)(\w)s   DivX(\d+)b(\d+)(\w)é   ó   pr   F)Z	any_frameZbackwardrA   c                    s2   g | ]*}ˆˆ| j   kr"ˆ krn qˆ| ‘qS r   ©Úpts©Ú.0Úi©rF   ÚframesrE   r   r   Ú
<listcomp>Ò   s
        z%_read_from_stream.<locals>.<listcomp>c                    s   g | ]}|ˆ k r|‘qS r   r   rQ   )rE   r   r   rV   ×   s      )Ú_CALLED_TIMESÚ_GC_COLLECTION_INTERVALÚgcZcollectÚintÚmathÚfloorÚ	time_baser4   ÚceilÚwarningsÚwarnÚtypeÚcodec_contextÚ	extradataÚfindÚreÚsearchÚgroupÚmaxÚseekr   ÚAVErrorÚ	enumerateÚdecoderP   ÚsortedÚlenÚinsert)r@   rE   rF   rG   rA   rH   Zshould_bufferÚmax_buffer_sizerc   ÚposÚdÚoZseek_offsetZbuffer_countZ_idxrB   ÚresultZpreceding_framesZfirst_frame_ptsr   rT   r   Ú_read_from_streamŽ   s^    	




"ru   )ÚaframesÚaudio_framesÚ	ref_startÚref_endr   c           
      C   s|   |d j |d j  }}| jd }|| d | }d}|}	||k rPt|| | ƒ}||krht|| | ƒ}	| d d …||	…f S )Nr   éÿÿÿÿr   )rP   r8   rZ   )
rv   rw   rx   ry   ÚstartÚendZtotal_aframesZstep_per_aframeZs_idxZe_idxr   r   r   Ú_align_audio_framesÞ   s    
r}   rP   ÚTHWC)r   Ú	start_ptsÚend_ptsrG   Úoutput_formatr   c              	   C   s|  t j ¡ st j ¡ sttƒ | ¡ }|dkr<td|› dƒ‚ddlm	} t
j | ¡sbtd| › ƒ‚|ƒ dkr|t | |||¡S tƒ  |dkr’td	ƒ}||k r®td
|› d|› ƒ‚i }g }g }tj}	zºtj| dd¢}
|
jjrè|
jjd j}	|
jjr4t|
||||
jjd ddiƒ}|
jjd j}|dk	r4t|ƒ|d< |
jjrnt|
||||
jjd ddiƒ}|
jjd j|d< W 5 Q R X W n tjk
r’   Y nX dd„ |D ƒ}dd„ |D ƒ}|rÈt  t |¡¡}nt j dt j!d}|rHt "|d¡}t  |¡}|dkr8t#t$ %|d|	  ¡ƒ}|td	ƒkr8t#t$ &|d|	  ¡ƒ}t'||||ƒ}nt j dt j(d}|dkrr| )dddd¡}|||fS )a  
    Reads a video from a file, returning both the video frames as well as
    the audio frames

    Args:
        filename (str): path to the video file
        start_pts (int if pts_unit = 'pts', float / Fraction if pts_unit = 'sec', optional):
            The start presentation time of the video
        end_pts (int if pts_unit = 'pts', float / Fraction if pts_unit = 'sec', optional):
            The end presentation time
        pts_unit (str, optional): unit in which start_pts and end_pts values will be interpreted,
            either 'pts' or 'sec'. Defaults to 'pts'.
        output_format (str, optional): The format of the output video tensors. Can be either "THWC" (default) or "TCHW".

    Returns:
        vframes (Tensor[T, H, W, C] or Tensor[T, C, H, W]): the `T` video frames
        aframes (Tensor[K, L]): the audio frames, where `K` is the number of channels and `L` is the number of points
        info (Dict): metadata for the video and audio. Can contain the fields video_fps (float) and audio_fps (int)
    )r~   ÚTCHWz5output_format should be either 'THWC' or 'TCHW', got Ú.r   ©Úget_video_backendzFile not found: ÚpyavNrJ   z7end_pts should be larger than start_pts, got start_pts=z and end_pts=Úignore©Zmetadata_errorsrL   Ú	video_fpsr<   r    c                 S   s   g | ]}|  ¡  ¡ ‘qS r   )Zto_rgbÚ
to_ndarray©rR   rB   r   r   r   rV   D  s     zread_video.<locals>.<listcomp>c                 S   s   g | ]}|  ¡ ‘qS r   )rŠ   r‹   r   r   r   rV   E  s     )r   r   r   rM   r#   r   rI   )r   r   r‚   rM   r	   )*r,   r-   r.   r/   r
   Ú
read_videoÚupperÚ
ValueErrorÚtorchvisionr…   ÚosÚpathÚexistsÚRuntimeErrorr   Z_read_videor   r4   Zdefault_timebaser   r7   r;   r<   r]   rL   ru   Úaverage_rater'   rj   r1   r5   ÚstackÚemptyr2   ZconcatenaterZ   r[   r\   r^   r}   Zfloat32Zpermute)r   r   r€   rG   r   r…   ÚinfoZvideo_framesrw   Zaudio_timebaser@   r‰   Zvframes_listZaframes_listZvframesrv   r   r   r   rŒ   í   s€    


ú


ú 


rŒ   )r@   r   c                 C   s*   | j d jj}|d krdS d|kr&dS dS )Nr   Fs   LavcT)r;   rb   rc   )r@   rc   r   r   r   Ú!_can_read_timestamps_from_packets^  s    r˜   c                 C   s8   t | ƒrdd„ | jddD ƒS dd„ | jddD ƒS d S )Nc                 S   s   g | ]}|j d k	r|j ‘qS r   rO   ©rR   Úxr   r   r   rV   j  s     
 z,_decode_video_timestamps.<locals>.<listcomp>r   )rL   c                 S   s   g | ]}|j d k	r|j ‘qS r   rO   r™   r   r   r   rV   l  s     
 )r˜   Zdemuxrl   )r@   r   r   r   Ú_decode_video_timestampsg  s    r›   )r   rG   r   c           	   
      s2  t j ¡ st j ¡ sttƒ ddlm} |ƒ dkr>t 	| |¡S t
ƒ  d}g }zvtj| dd^}|jjr¶|jjd }|j‰ zt|ƒ}W n& tjk
rª   t d| › ¡ Y nX t|jƒ}W 5 Q R X W nB tjk
r } z d| › d	|› }t |t¡ W 5 d}~X Y nX | ¡  |d
kr*‡ fdd„|D ƒ}||fS )a   
    List the video frames timestamps.

    Note that the function decodes the whole video frame-by-frame.

    Args:
        filename (str): path to the video file
        pts_unit (str, optional): unit in which timestamp values will be returned
            either 'pts' or 'sec'. Defaults to 'pts'.

    Returns:
        pts (List[int] if pts_unit = 'pts', List[Fraction] if pts_unit = 'sec'):
            presentation timestamps for each one of the frames in the video.
        video_fps (float, optional): the frame rate for the video

    r   r„   r†   Nr‡   rˆ   z Failed decoding frames for file zFailed to open container for z; Caught error: rI   c                    s   g | ]}|ˆ  ‘qS r   r   r™   ©Zvideo_time_baser   r   rV     s     z)read_video_timestamps.<locals>.<listcomp>)r,   r-   r.   r/   r
   Úread_video_timestampsr   r…   r   Z_read_video_timestampsr   r   r7   r;   rL   r]   r›   rj   r_   r`   r4   r”   ÚRuntimeWarningÚsort)	r   rG   r…   r‰   rP   r@   Zvideo_streamÚeÚmsgr   rœ   r   r   o  s2    

r   )r   NNNNN)r   NrP   r~   )rP   ).rY   r[   r   re   r_   Z	fractionsr   Útypingr   r   r   r   r   r   r3   r5   r,   Úutilsr
   Ú r   r   ÚloggingZ	set_levelÚERRORÚhasattrrL   rB   r?   ÚImportErrorr   Úboolr   rW   rX   ÚstrZTensorr4   r0   rZ   ru   r}   rŒ   r˜   r›   r   r   r   r   r   Ú<module>   s    ÿ	ÿ
	      ÷öY$ùQ   þ    û
úq	