o
    €o™iÏ:  ã                
   @   s$  U d dl Z d dlmZmZmZmZ d dlZd dlm  m	Z
 d dlmZmZmZ d dlmZ d dlmZmZ d dlmZ d dlmZmZ dd	lmZ dd
lmZmZmZ i Zee e f e!d< ded< G dd„ deƒZ"G dd„ deƒZ#dedee$e$f defdd„Z%dedede$de$def
dd„Z&dS )é    N)ÚAnyÚDictÚOptionalÚTuple)ÚModuleÚTensorÚconcatenate)ÚKORNIA_CHECK_SHAPE)ÚDetectorCfgÚLineMatcherCfg)Únormalize_pixel_coordinates)Údataclass_to_dictÚdict_to_dataclassé   )ÚSOLD2Net)ÚLineSegmentDetectionModuleÚline_map_to_segmentsÚprob_to_junctionsÚurlsz<http://cmp.felk.cvut.cz/~mishkdmy/models/sold2_wireframe.pthÚ	wireframec                
       sŽ   e Zd ZdZddedee ddf‡ fdd„Zd	ede	e
ef fd
d„Zdededededef
dd„Zde	e
ef de	e
ef fdd„Z‡  ZS )ÚSOLD2u  Module, which detects and describe line segments in an image.

    This is based on the original code from the paper "SOLDÂ²: Self-supervised
    Occlusion-aware Line Detector and Descriptor". See :cite:`SOLD22021` for more details.

    Args:
        config: Dict specifying parameters. None will load the default parameters,
            which are tuned for images in the range 400~800 px.
        pretrained: If True, download and set pretrained weights to the model.

    Returns:
        The raw junction and line heatmaps, the semi-dense descriptor map,
        as well as the list of detected line segments (ij coordinates convention).

    Example:
        >>> images = torch.rand(2, 1, 64, 64)
        >>> sold2 = SOLD2()
        >>> outputs = sold2(images)
        >>> line_seg1 = outputs["line_segments"][0]
        >>> line_seg2 = outputs["line_segments"][1]
        >>> desc1 = outputs["dense_desc"][0]
        >>> desc2 = outputs["dense_desc"][1]
        >>> matches = sold2.match(line_seg1, line_seg2, desc1[None], desc2[None])

    TNÚ
pretrainedÚconfigÚreturnc                    sØ   t |tƒrtjdtdd t|tƒ}tƒ  ¡  |d ur|ntƒ | _	d| j	_
| j	j| _| j	j| _| j	j| _tt| j	ƒƒ| _|rXtjjtd t d¡d}|  |d ¡}| j |¡ |  ¡  t| j	jƒ| _t| j	jƒ| _d S )	NzÌUsage of config as a plain dictionary is deprecated in favor of `kornia.features.sold2.structures.DetectorCfg`. The support of plain dictionariesas config will be removed in kornia v0.8.0 (December 2024).é   )ÚcategoryÚ
stacklevelTr   Úcpu)Úmap_locationÚmodel_state_dict) Ú
isinstanceÚdictÚwarningsÚwarnÚDeprecationWarningr   r
   ÚsuperÚ__init__r   Úuse_descriptorÚ	grid_sizeÚdetection_threshÚjunc_detect_threshÚmax_num_junctionsr   r   ÚmodelÚtorchÚhubÚload_state_dict_from_urlr   ÚdeviceÚadapt_state_dictÚload_state_dictÚevalr   Úline_detector_cfgÚline_detectorÚWunschLineMatcherÚline_matcher_cfgÚline_matcher)Úselfr   r   Úpretrained_dictÚ
state_dict©Ú	__class__© úN/home/ubuntu/.local/lib/python3.10/site-packages/kornia/feature/sold2/sold2.pyr&   @   s*   
û




zSOLD2.__init__Úimgc           
      C   s¤   t |g d¢ƒ i }|  |¡}|d |d< |d |d< |d |d< g }t|d |d ƒD ] \}}t|| j| j| jƒ}| j ||¡\}}}	| 	t
||ƒ¡ q+||d< |S )	aÍ  Run forward.

        Args:
            img: batched images with shape :math:`(B, 1, H, W)`.

        Returns:
            line_segments: list of N line segments in each of the B images :math:`List[(N, 2, 2)]`.
            junction_heatmap: raw junction heatmap of shape :math:`(B, H, W)`.
            line_heatmap: raw line heatmap of shape :math:`(B, H, W)`.
            dense_desc: the semi-dense descriptor map of shape :math:`(B, 128, H/4, W/4)`.

        )ÚBÚ1ÚHÚWÚ	junctionsÚjunction_heatmapÚheatmapÚline_heatmapÚdescriptorsÚ
dense_descÚline_segments)r	   r,   Úzipr   r(   r*   r+   r5   ÚdetectÚappendr   )
r9   r@   ÚoutputsÚnet_outputsÚlinesÚ	junc_probrG   rE   Úline_mapÚ_r>   r>   r?   Úforward`   s   
zSOLD2.forwardÚ	line_seg1Ú	line_seg2Údesc1Údesc2c                 C   s   |   ||||¡S )a—  Find the best matches between two sets of line segments and their corresponding descriptors.

        Args:
            line_seg1: list of line segments in image 1, with shape [num_lines, 2, 2].
            line_seg2: list of line segments in image 2, with shape [num_lines, 2, 2].
            desc1: semi-dense descriptor map of image 1, with shape [1, 128, H/4, W/4].
            desc2: semi-dense descriptor map of image 2, with shape [1, 128, H/4, W/4].

        Returns:
            A np.array of size [num_lines1] indicating the index in line_seg2 of the matched line,
            for each line in line_seg1. -1 means that the line is not matched.

        )r8   )r9   rV   rW   rX   rY   r>   r>   r?   Úmatchƒ   s   zSOLD2.matchr;   c                 C   s:   |d= |d= |d= |d |d< |d |d< |d= |d= |S )NÚw_juncÚ	w_heatmapÚw_descz'heatmap_decoder.conv_block_lst.2.weightz)heatmap_decoder.conv_block_lst.2.0.weightz%heatmap_decoder.conv_block_lst.2.biasz'heatmap_decoder.conv_block_lst.2.0.biasr>   )r9   r;   r>   r>   r?   r1   “   s   zSOLD2.adapt_state_dict)TN)Ú__name__Ú
__module__Ú__qualname__Ú__doc__Úboolr   r
   r&   r   r   Ústrr   rU   rZ   r1   Ú__classcell__r>   r>   r<   r?   r   %   s      #*r   c                
       sŒ   e Zd ZdZddee ddf‡ fdd„Zdeded	ed
edef
dd„Zdede	eef fdd„Z
dedefdd„Zdedefdd„Z‡  ZS )r6   z†Class matching two sets of line segments with the Needleman-Wunsch algorithm.

    TODO: move it later in kornia.feature.matching
    Nr   r   c                    s^   t ƒ  ¡  |d u rtƒ }|| _| jj| _| jj| _| jj| _| jj| _| jj| _| jj	| _	d S ©N)
r%   r&   r   r   Úcross_checkÚnum_samplesÚmin_dist_ptsÚtop_k_candidatesr(   Ú
line_score)r9   r   r<   r>   r?   r&   ¤   s   



zWunschLineMatcher.__init__rV   rW   rX   rY   c                 C   s  t |g d¢ƒ t |g d¢ƒ t |g d¢ƒ t |g d¢ƒ |j}|jd | j |jd | j f}|jd | j |jd | j f}t|ƒdkrNtjdtj|dS t|ƒdkr`tjt|ƒtj|d S |  	|¡\}}	|  	|¡\}
}| 
dd¡}|
 
dd¡}
t||ƒ}t|
|ƒ}tjtj||dd	dd
d
…d
d
…df dd}tjtj||dd	dd
d
…d
d
…df dd}| ¡ | }d||	 ¡  < d|d
d
…| ¡  f< | 
t|ƒ| jt|ƒ| j¡}| dddd¡}|  |¡}| jr|  | dddd¡¡}|| tjt|ƒ|dk}d|| < |S )z\Find the best matches between two sets of line segments and their corresponding descriptors.)ÚNÚ2rl   )rA   ÚDrC   rC   r   é   r   ©Údtyper0   éÿÿÿÿF)Úalign_cornersN©Údimr   ©r0   )r	   r0   Úshaper(   Úlenr-   ÚemptyÚintÚonesÚsample_line_pointsÚreshapeÚkeypoints_to_gridÚFÚ	normalizeÚgrid_sampleÚtÚflattenrg   ÚpermuteÚfilter_and_match_linesrf   Úarange)r9   rV   rW   rX   rY   r0   Ú	img_size1Ú	img_size2Úline_points1Úvalid_points1Úline_points2Úvalid_points2Úgrid1Úgrid2ÚscoresÚmatchesÚmatches2Úmutualr>   r>   r?   rU   ±   s<     

..

zWunschLineMatcher.forwardÚline_segc                 C   s  |j \}}}| j}|j}tj|dd…df |dd…df  dd}tj|| j  ¡  ¡ d|d}|dd…df  	d¡}|dd…df |dd…df   	d¡}	tj
||d 	d¡}
|d  	d¡}|
| }||	| 	d¡  }|
| 	d¡k }| | 	d¡ d	¡}||fS )
aE  Regularly sample points along each line segments, with a minimal distance between each point.

        Pad the remaining points.

        Args:
            line_seg: an Nx2x2 Tensor.

        Returns:
            line_points: an N x num_samples x 2 Tensor.
            valid_points: a boolean N x num_samples Tensor.
        Nr   r   rs   r   )ÚminÚmaxru   rq   g        )rv   rg   r0   r-   ÚnormÚclamprh   Úfloorry   Ú	unsqueezer…   Úmasked_fill)r9   r’   Ú_NrT   ÚMÚdevÚlengthsÚnum_ptsÚorigÚdirsÚidxÚdenomÚalphaÚptsÚvalidr>   r>   r?   r{   á   s   *&z$WunschLineMatcher.sample_line_pointsrŽ   c                 C   s>  t |g d¢ƒ | d¡d }|dk}||  d¡| d¡ }| d¡d }|dk}||  d¡| d¡ }|| d }tj|dddd…| j d…f }tj||dd…dd…ddf dd}t|tj|dgd	gdƒ}|j	\}	}
}}| 
|	|
 ||f¡}|  |¡}| 
|	|
¡}t tj|dd|
d ¡}|t |	¡|f }|S )
az  Use scores to keep the top k best lines.

        Compute the Needleman- Wunsch algorithm on each candidate pairs, and keep the highest score.

        Args:
            scores: a (N, M, n, n) Tensor containing the pairwise scores
                    of the elements to match.

        Returns:
            matches: a (N) Tensor containing the indices of the best match
        )r›   rk   Únr¦   rn   r   rq   r   r   rs   N)Údims)r	   r”   Úsumr-   Úargsortri   Útake_along_dimr   Úfliprv   r|   Úneedleman_wunschÚ	remainderÚargmaxr…   )r9   rŽ   Úline_scores1Úvalid_scores1Úline_scores2Úvalid_scores2Úline_scoresÚ
topk_linesÚ
top_scoresÚn_lines1Útop2kr¦   ÚmÚ	nw_scoresr   r>   r>   r?   r„   ÿ   s$   "$
z(WunschLineMatcher.filter_and_match_linesc                 C   s(  t |g d¢ƒ d}|j\}}}tj||d |d |jd}|| }td|| d ƒD ]`}td|| ƒ}	t||d ƒ}
tj|	|
d |jd}|| }|dd…|d |f }|dd…||d f }|dd…|d |d f |dd…|d |d f  }t t ||¡|¡|dd…||f< q*|dd…ddf S )a0  Batched implementation of the Needleman-Wunsch algorithm.

        The cost of the InDel operation is set to 0 by subtracting the gap
        penalty to the scores.

        Args:
            scores: a (B, N, M) Tensor containing the pairwise scores
                    of the elements to match.
        )rA   rk   r›   gš™™™™™¹?r   ru   r   Nrq   )	r	   rv   r-   Úzerosr0   Úranger”   r“   r…   )r9   rŽ   ÚgaprA   rk   r›   ÚdpÚSÚkÚi_minÚi_maxÚiÚjÚupÚleftÚdiagr>   r>   r?   r¬   '  s   
4$z"WunschLineMatcher.needleman_wunschre   )r^   r_   r`   ra   r   r   r&   r   rU   r   r{   r„   r¬   rd   r>   r>   r<   r?   r6   ž   s    0(r6   Ú	keypointsÚimg_sizer   c                 C   sN   t | ddgƒ t| ƒ}t| dd…ddgf |d |d ƒ}| d|dd¡}|S )uú   Convert a list of keypoints into a grid in [-1, 1]Â² that can be used in torch.nn.functional.interpolate.

    Args:
        keypoints: a tensor [N, 2] of N keypoints (ij coordinates convention).
        img_size: the original image size (H, W)

    rk   rl   Nr   r   rq   r   )r	   rw   r   Úview)rÇ   rÈ   Ún_pointsÚgrid_pointsr>   r>   r?   r}   C  s
   $r}   ÚstartÚendÚsteprt   c                 C   s^   ||  |d    |¡}dgt|jƒ }|||< tj|tj| jd |¡}|   |¡||  }|S )z<Batch version of torch.normalize (similar to the numpy one).r   ro   )r˜   rw   rv   r-   r…   Úfloatr0   r|   )rÌ   rÍ   rÎ   rt   Ú	intervalsÚbroadcast_sizeÚsamplesr>   r>   r?   Úbatched_linspaceR  s   rÓ   )'r"   Útypingr   r   r   r   r-   Útorch.nn.functionalÚnnÚ
functionalr~   Úkornia.corer   r   r   Úkornia.core.checkr	   Úkornia.feature.sold2.structuresr
   r   Úkornia.geometry.conversionsr   Úkornia.utilsr   r   Ú	backbonesr   Úsold2_detectorr   r   r   r   rc   Ú__annotations__r   r6   ry   r}   rÓ   r>   r>   r>   r?   Ú<module>   s$   
y &"