o ¾e¦i<ã@sÎddlZddlZddlmZddlmZmZmZddl m Z mZmZm Z mZmZmZeƒr3ddlmZeƒr9óz2LwDetrHungarianMatcher.forward..cSr©Úboxesrrrrrr:rgÐ?g@g:Œ0âŽyE>)ÚpéÿÿÿÿcSóg|]}t|dƒ‘qSr ©ÚlenrrrrrQó©ÚdimcSsg|] \}}t||ƒ‘qSrr)rÚiÚcrrrrWscsDg|]\}}t |d|dˆˆg¡t |d|dg¡f‘qS)rr)ÚnpÚconcatenate)rÚindice1Úindice2©Úgroup_idÚgroup_num_queriesrrr[sýþÿcSs0g|]\}}tj|tjdtj|tjdf‘qS))Údtype)ÚtorchÚ as_tensorÚint64)rr*Újrrrrbs0)ÚshapeÚflattenÚsigmoidr4ÚcatÚlogr3ÚtoÚfloat32ÚcdistrrÚ bbox_costÚ class_costÚ giou_costÚviewÚcpuÚsplitÚrangeÚ enumerateÚzip)ÚselfÚoutputsÚtargetsÚ group_detrÚ batch_sizeÚnum_queriesÚout_probÚout_bboxÚ target_idsÚtarget_bboxÚalphaÚgammaÚneg_cost_classÚpos_cost_classrAr3r@rBÚcost_matrixÚsizesÚindicesÚcost_matrix_listÚgroup_cost_matrixÚ group_indicesrr0rÚforward+s>" ûzLwDetrHungarianMatcher.forwardN)Ú__name__Ú __module__Ú__qualname__r4Úno_gradr]rrrrr*srcsdeZdZ‡fdd„Zdd„Ze ¡dd„ƒZdd„Zd d „Z dd„Z d d„Zdd„Zdd„Z ‡ZS)ÚLwDetrImageLosscs,tƒ ¡||_||_||_||_||_dS©N)ÚsuperÚ__init__ÚmatcherÚnum_classesÚfocal_alphaÚlossesrL)rIrfrgrhrirL©Ú __class__rrrefs zLwDetrImageLoss.__init__cCsJd|vrtdƒ‚|d}| |¡}t dd„t||ƒDƒ¡}|j}d} |d|} tjdd„t||ƒDƒdd }t tt| ¡ƒt|ƒƒd¡}| |j¡}| ¡ ¡} | ¡}t |¡}|| }t|ƒ}| |¡|| |¡| d |¡}t |d¡ ¡}|||<d |||<|| ¡|d | ¡}| ¡|}d|i}|S) Nrz#No logits were found in the outputscSó g|]\}\}}|d|‘qSrr)rÚtÚ_ÚJrrrruó z/LwDetrImageLoss.loss_labels..rrcSrlr r©rrmrnr*rrrryrprr(rg{®Gáz„?Úloss_ce)ÚKeyErrorÚ_get_source_permutation_idxr4r;rHrhÚdiagr rÚdetachr=r3Úcloner:Ú zeros_likeÚlistÚappendÚpowÚclampr<Úsum)rIrJrKrYÚ num_boxesÚ source_logitsÚidxÚtarget_classes_orSrTÚ src_boxesÚtarget_boxesÚiou_targetsÚpos_iousÚprobÚpos_weightsÚneg_weightsÚpos_indrmrrrirrrÚloss_labelsos6 ÿ zLwDetrImageLoss.loss_labelscCsb|d}|j}tjdd„|Dƒ|d}| ¡ d¡jdk d¡}tj | ¡| ¡¡} d| i} | S) zâ Compute the cardinality error, i.e. the absolute error in the number of predicted non-empty boxes. This is not really a loss, it is intended for logging purposes only. It doesn't propagate gradients. rcSr$rr%rrrrrœr'z4LwDetrImageLoss.loss_cardinality..)Údevicer#gà?rÚcardinality_error)r‹r4r5r:ÚmaxÚvaluesr}ÚnnÚ functionalÚl1_lossÚfloat)rIrJrKrYr~rr‹Útarget_lengthsÚ card_predÚcard_errrirrrÚloss_cardinality“sz LwDetrImageLoss.loss_cardinalitycCsšd|vrtdƒ‚| |¡}|d|}tjdd„t||ƒDƒdd}tjj||dd}i} | ¡|| d <d t t t|ƒt|ƒƒ¡} | ¡|| d<| S)a< Compute the losses related to the bounding boxes, the L1 regression loss and the GIoU loss. Targets dicts must contain the key "boxes" containing a tensor of dim [nb_target_boxes, 4]. The target boxes are expected in format (center_x, center_y, w, h), normalized by the image size. rz#No predicted boxes found in outputscSrlr rrqrrrr¯rpz.LwDetrImageLoss.loss_boxes..rr(Únone)Ú reductionÚ loss_bboxrÚ loss_giou)rsrtr4r;rHrrr‘r}rurr)rIrJrKrYr~r€Úsource_boxesrƒr™riršrrrÚ loss_boxes¤s ÿzLwDetrImageLoss.loss_boxescCsØd|vrtdƒ‚| |¡}| |¡}|d}||}dd„|Dƒ}t|ƒ ¡\} } | |¡} | |} tjj|dd…df| j dd…ddd }|dd…d f d¡}| d¡} | |j ¡} t|| |ƒt || |ƒdœ}|S) zÄ Compute the losses related to the masks: the focal loss and the dice loss. Targets dicts must contain the key "masks" containing a tensor of dim [nb_target_boxes, h, w]. Ú pred_masksz#No predicted masks found in outputscSr)Úmasksr©rrmrrrrÊrz.LwDetrImageLoss.loss_masks..NéþÿÿÿÚbilinearF)ÚsizeÚmodeÚ align_cornersrr)Ú loss_maskÚ loss_dice)rsrtÚ_get_target_permutation_idxrÚ decomposer=rrÚinterpolater8r9rCr r )rIrJrKrYr~Ú source_idxÚ target_idxÚsource_masksržÚtarget_masksÚvalidrirrrÚ loss_masks½s( ÿ þzLwDetrImageLoss.loss_maskscCó4t dd„t|ƒDƒ¡}t dd„|Dƒ¡}||fS)NcSs g|]\}\}}t ||¡‘qSr©r4Ú full_like)rr*Úsourcernrrrrárpz?LwDetrImageLoss._get_source_permutation_idx..cSsg|]\}}|‘qSrr)rr³rnrrrrâr©r4r;rG)rIrYÚ batch_idxrªrrrrtßóz+LwDetrImageLoss._get_source_permutation_idxcCr°)NcSs g|]\}\}}t ||¡‘qSrr±)rr*rnÚtargetrrrrèrpz?LwDetrImageLoss._get_target_permutation_idx..cSsg|]\}}|‘qSrr)rrnr·rrrrérr´)rIrYrµr«rrrr§ær¶z+LwDetrImageLoss._get_target_permutation_idxcCs@|j|j|j|jdœ}||vrtd|›dƒ‚||||||ƒS)N)ÚlabelsÚcardinalityr!ržzLoss z not supported)rŠr–rœr¯Ú ValueError)rIÚlossrJrKrYr~Úloss_maprrrÚget_lossìsüzLwDetrImageLoss.get_lossc s |jr|jnd}dd„| ¡Dƒ}| |||¡}tdd„|Dƒƒ}||}tj|gtjtt | ¡ƒƒjd}d}tƒrHt jikrHt|ƒ}t ƒj}tj||dd ¡}i}|jD]} | | | ||||¡¡qXd|vr¡t|dƒD]/\‰} | | ||¡}|jD] } | d kr†q| | | |||¡}‡fd d„| ¡Dƒ}| |¡qqqd|vrÎ|d}|j|||d}|jD]} | | ||||¡}d d„| ¡Dƒ}| |¡q´|S)aª This performs the loss computation. Args: outputs (`dict`, *optional*): Dictionary of tensors, see the output specification of the model for the format. targets (`list[dict]`, *optional*): List of dicts, such that `len(targets) == batch_size`. The expected keys in each dict depends on the losses applied, see each loss' doc. rcSs&i|]\}}|dkr|dkr||“qS)Úenc_outputsÚauxiliary_outputsr©rÚkrrrrÚ s z+LwDetrImageLoss.forward..css|] }t|dƒVqdS)rNr%rŸrrrÚ s€z*LwDetrImageLoss.forward..)r3r‹)Úminr¿ržcó i|]\}}|dˆ›|“qS©rnrrÀ©r*rrrÂ#rpr¾)rLcSói|] \}}|d|“qS©Ú_encrrÀrrrrÂ+ó)ÚtrainingrLÚitemsrfr}r4r5r’ÚnextÚiterrŽr‹rrÚ _shared_staterÚ num_processesr|ÚitemriÚupdater½rG) rIrJrKrLÚoutputs_without_aux_and_encrYr~Ú world_sizerir»r¿Úl_dictr¾rrÇrr]÷sFÿ" ú zLwDetrImageLoss.forward)r^r_r`rerŠr4rar–rœr¯rtr§r½r]Ú __classcell__rrrjrrbes $ "rbc st|j|j|jd} gd¢}t| |j|j||jd}| |¡i} d}|| d<|| d<||dœ| d<|j r>t ||ƒ}|| d<|| |ƒ‰d |jd œ‰|jˆd<|j rpi}t |jd ƒD]‰| ‡fdd „ˆ ¡Dƒ¡qZˆ |¡dd „ˆ ¡Dƒ}ˆ |¡t‡‡fdd„ˆDƒƒ}|ˆ|fS)N)rAr@rB)r¸r!r¹)rfrgrhrirLrr)rrr¾r¿r)rrr™ršcrÅrÆrrÀrÇrrrÂ^rpz0LwDetrForObjectDetectionLoss..cSrÈrÉrrÀrrrrÂ`rËc3s(|]}|ˆvrˆ|ˆ|VqdSrcr)rrÁ)Ú loss_dictÚweight_dictrrrÃbs€&z/LwDetrForObjectDetectionLoss..)rrAr@rBrbÚ num_labelsrhrLr=Úauxiliary_lossrÚbbox_loss_coefficientÚgiou_loss_coefficientrFÚdecoder_layersrÓrÍr})rr¸r‹rÚconfigÚ outputs_classÚ outputs_coordÚenc_outputs_classÚenc_outputs_coordÚkwargsrfriÚ criterionÚoutputs_lossr¿Úaux_weight_dictÚenc_weight_dictr»r)r*rØrÙrÚLwDetrForObjectDetectionLoss1sD ÿû þ ré)NNNN)Únumpyr,r4Útorch.nnrÚutilsrrrÚloss_for_object_detectionrrr r rrr Útransformers.image_transformsrÚscipy.optimizerÚ acceleraterÚaccelerate.utilsrrÚModulerbrérrrrÚs( $;S÷