|
|
|
"""Loss functions.""" |
|
|
|
import torch |
|
import torch.nn as nn |
|
import torchvision |
|
import torch.nn.functional as F |
|
from utils.metrics import bbox_iou |
|
from utils.torch_utils import de_parallel |
|
from torch.nn.functional import cosine_similarity |
|
import numpy as np |
|
from utils.general import (
    LOGGER,
    TQDM_BAR_FORMAT,
    Profile,
    xywh2xyxy,
    xyxy2xywh,
    non_max_suppression_ps,
    scale_boxes,
    get_fixed_xyxy,
)
|
|
|
|
|
def smooth_BCE(eps=0.1): |
|
"""Returns label smoothing BCE targets for reducing overfitting; pos: `1.0 - 0.5*eps`, neg: `0.5*eps`. For details see https://github.com/ultralytics/yolov3/issues/238#issuecomment-598028441""" |
|
return 1.0 - 0.5 * eps, 0.5 * eps |
|
|
|
|
|
class BCEBlurWithLogitsLoss(nn.Module): |
|
|
|
def __init__(self, alpha=0.05): |
|
"""Initializes a modified BCEWithLogitsLoss with reduced missing label effects, taking optional alpha smoothing |
|
parameter. |
|
""" |
|
super().__init__() |
|
self.loss_fcn = nn.BCEWithLogitsLoss(reduction="none") |
|
self.alpha = alpha |
|
|
|
def forward(self, pred, true): |
|
"""Computes modified BCE loss for YOLOv5 with reduced missing label effects, taking pred and true tensors, |
|
returns mean loss. |
|
""" |
|
loss = self.loss_fcn(pred, true) |
|
pred = torch.sigmoid(pred) |
|
dx = pred - true |
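        # dx is close to 1 when the model is confident but the label is 0 (a likely
        # missing annotation); alpha_factor then vanishes, suppressing that loss term.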
|
|
|
alpha_factor = 1 - torch.exp((dx - 1) / (self.alpha + 1e-4)) |
|
loss *= alpha_factor |
|
return loss.mean() |
|
|
|
|
|
class FocalLoss(nn.Module): |
|
|
|
def __init__(self, loss_fcn, gamma=1.5, alpha=0.25): |
|
"""Initializes FocalLoss with specified loss function, gamma, and alpha values; modifies loss reduction to |
|
'none'. |
|
""" |
|
super().__init__() |
|
self.loss_fcn = loss_fcn |
|
self.gamma = gamma |
|
self.alpha = alpha |
|
self.reduction = loss_fcn.reduction |
|
self.loss_fcn.reduction = "none" |
|
|
|
    def forward(self, pred, true, mask=None, object_loss=False, patch=False):
        """Calculates the focal loss between predicted and true labels using a modified BCEWithLogitsLoss."""
        loss = self.loss_fcn(pred, true)
        if object_loss:
            # Restrict the loss to cells selected by the mask (e.g. the patch region).
            loss = loss * mask
|
pred_prob = torch.sigmoid(pred) |
|
p_t = true * pred_prob + (1 - true) * (1 - pred_prob) |
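        # alpha balances positive/negative examples and (1 - p_t)^gamma down-weights
        # easy examples (Lin et al., "Focal Loss for Dense Object Detection").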
|
alpha_factor = true * self.alpha + (1 - true) * (1 - self.alpha) |
|
modulating_factor = (1.0 - p_t) ** self.gamma |
|
loss *= alpha_factor * modulating_factor |
|
        if object_loss and patch:
            if self.reduction == "mean":
                # Average over the masked (patch) cells only, not the full feature map.
                return loss.sum() / (mask > 0).sum().item()
            elif self.reduction == "sum":
                return loss.sum()
        else:
            if self.reduction == "mean":
                return loss.mean()
            elif self.reduction == "sum":
                return loss.sum()
|
|
|
return loss |
|
|
|
|
|
class QFocalLoss(nn.Module): |
|
|
|
def __init__(self, loss_fcn, gamma=1.5, alpha=0.25): |
|
"""Initializes Quality Focal Loss with given loss function, gamma, alpha; modifies reduction to 'none'.""" |
|
super().__init__() |
|
self.loss_fcn = loss_fcn |
|
self.gamma = gamma |
|
self.alpha = alpha |
|
self.reduction = loss_fcn.reduction |
|
self.loss_fcn.reduction = "none" |
|
|
|
def forward(self, pred, true): |
|
"""Computes the focal loss between `pred` and `true` using BCEWithLogitsLoss, adjusting for imbalance with |
|
`gamma` and `alpha`. |
|
""" |
|
loss = self.loss_fcn(pred, true) |
|
|
|
pred_prob = torch.sigmoid(pred) |
|
alpha_factor = true * self.alpha + (1 - true) * (1 - self.alpha) |
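        # Quality-focal modulation: |true - p|^gamma focuses the loss on cells whose
        # predicted quality diverges most from the target (cf. Generalized Focal Loss).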
|
modulating_factor = torch.abs(true - pred_prob) ** self.gamma |
|
loss *= alpha_factor * modulating_factor |
|
|
|
if self.reduction == "mean": |
|
return loss.mean() |
|
elif self.reduction == "sum": |
|
return loss.sum() |
|
else: |
|
return loss |
|
|
|
|
|
class ComputeLoss: |
|
sort_obj_iou = False |
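    # When True, candidate objectness targets are sorted by IoU so that higher-quality
    # matches overwrite lower-quality ones if several targets share a grid cell.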
|
|
|
|
|
def __init__(self, model, autobalance=False): |
|
"""Initializes ComputeLoss with model and autobalance option, autobalances losses if True.""" |
|
device = next(model.parameters()).device |
|
h = model.hyp |
|
|
|
|
|
        # Define class and objectness criteria with positive-class weights from hyp.
        BCEcls = nn.BCEWithLogitsLoss(pos_weight=torch.tensor([h["cls_pw"]], device=device))
        BCEobj = nn.BCEWithLogitsLoss(pos_weight=torch.tensor([h["obj_pw"]], device=device))
|
|
|
|
|
        self.cp, self.cn = smooth_BCE(eps=h.get("label_smoothing", 0.0))  # positive, negative BCE targets
|
|
|
|
|
g = h["fl_gamma"] |
|
if g > 0: |
|
BCEcls, BCEobj = FocalLoss(BCEcls, g), FocalLoss(BCEobj, g) |
|
|
|
        m = de_parallel(model).model[-1]  # Detect() module
        self.balance = {3: [4.0, 1.0, 0.4]}.get(m.nl, [4.0, 1.0, 0.25, 0.06, 0.02])  # per-level objectness weights
        self.ssi = list(m.stride).index(16) if autobalance else 0  # stride-16 index
|
self.BCEcls, self.BCEobj, self.gr, self.hyp, self.autobalance = BCEcls, BCEobj, 1.0, h, autobalance |
|
self.na = m.na |
|
self.nc = m.nc |
|
self.nl = m.nl |
|
self.anchors = m.anchors |
|
self.stride = m.stride |
|
self.device = device |
|
self.grid = [torch.empty(0) for _ in range(self.nl)] |
|
self.anchor_grid = [torch.empty(0) for _ in range(self.nl)] |
|
|
|
    def __call__(self, p, targets, feat, epoch):
        """Performs forward pass, calculating class, box, and object losses for given predictions and targets."""
|
p_lcls = torch.zeros(1, device=self.device) |
|
p_lbox = torch.zeros(1, device=self.device) |
|
p_lobj = torch.zeros(1, device=self.device) |
|
f_lcls = torch.zeros(1, device=self.device) |
|
f_lbox = torch.zeros(1, device=self.device) |
|
f_lobj = torch.zeros(1, device=self.device) |
|
|
|
|
|
|
|
        # targets[:, 6:10] are assumed to carry the per-image patch region in pixel
        # xyxy coordinates; keep (image, x1, y1, x2, y2) for mask construction.
        p_region = torch.cat((targets[:, 0:1], targets[:, 6:10]), dim=1)
        p_n = []
        complete_patch_mask = []
|
        for i in range(self.nl):
            selected_ratio = [8, 16, 32]  # feature-map strides of the three detection levels

            unique_boxes, _ = torch.unique(p_region, dim=0, return_inverse=True)
            extracted_slices = []
            patch_mask = []
            for l in range(p[i].shape[0]):
                # Assumes one unique patch box per batch image; scale it to this level's grid.
                _, x1, y1, x2, y2 = unique_boxes[l].int()
                x1, x2 = int(x1 / selected_ratio[i]), int(x2 / selected_ratio[i])
                y1, y2 = int(y1 / selected_ratio[i]), int(y2 / selected_ratio[i])

                # Keep only prediction cells that fall inside the patch region.
                mask = torch.zeros_like(p[i][l])
                mask[:, y1:y2, x1:x2, :] = 1
                masked_p = p[i][l] * mask

                extracted_slices.append(masked_p.squeeze(0))
                patch_mask.append(mask.squeeze(0))

            p_n.append(torch.stack(extracted_slices, dim=0))
            complete_patch_mask.append(torch.stack(patch_mask, dim=0))
|
|
|
|
|
|
|
|
|
        p_tcls, p_tbox, p_indices, p_anchors = self.build_targets(p_n, targets)

        p_lbox, p_lobj, p_lcls, p_bs, t_class_all, p_classes_path = self.loss_com_patch(
            p_tcls, p_tbox, p_indices, p_anchors, p_n, complete_patch_mask
        )
        pseudo_targets, patch_targets, original_targets, pseudo_targets_60_90 = self.pseudo_targets(p, targets)
|
|
|
        # The contrastive similarity loss is only applied during the first 20 epochs.
        if epoch < 20:
            similarity_loss_patch = self.similarity(feat, pseudo_targets_60_90, patch_targets, original_targets, 1)
            if similarity_loss_patch.item() != 0:
                similarity_loss_patch = similarity_loss_patch.unsqueeze(0)
        else:
            similarity_loss_patch = torch.zeros(1, device=self.device)
|
|
|
|
|
|
|
|
|
|
|
        # Pseudo-label losses, computed on the full (unmasked) prediction maps.
        if len(pseudo_targets) > 0:
            f_tcls, f_tbox, f_indices, f_anchors = self.build_targets(p, pseudo_targets)
            f_lbox, f_lobj, f_lcls, p_classes = self.loss_com_background(f_tcls, f_tbox, f_indices, f_anchors, p)
|
        # Combine patch losses with down-weighted pseudo-label and similarity terms.
        if len(pseudo_targets) > 0:
            lbox = p_lbox + f_lbox * 0.1
            lobj = p_lobj + f_lobj * 0.1
            lcls = p_lcls + f_lcls * 0.1 + similarity_loss_patch * 0.1
        else:
            lbox = p_lbox
            lobj = p_lobj
            lcls = p_lcls + similarity_loss_patch * 0.1

        # Final epoch: fall back to the patch losses alone.
        if epoch == 29:
            lbox = p_lbox
            lobj = p_lobj
            lcls = p_lcls

        return (lbox + lobj + lcls) * p_bs, torch.cat((p_lbox, p_lobj, p_lcls)).detach()
|
|
|
    def loss_com_patch(self, tcls, tbox, indices, anchors, p_n, complete_patch_masks):
        """Computes box, objectness, and class losses restricted to the patch region."""
        lcls = torch.zeros(1, device=self.device)
        lbox = torch.zeros(1, device=self.device)
        lobj = torch.zeros(1, device=self.device)

        t_classes_path = []
        p_classes_path = []
|
|
|
|
|
for i, (pi, pq) in enumerate(zip(p_n, complete_patch_masks)): |
|
b, a, gj, gi = indices[i] |
|
tobj = torch.zeros(pi.shape[:4], dtype=pi.dtype, device=self.device) |
|
|
|
n = b.shape[0] |
|
if n: |
|
|
|
pxy, pwh, _, pcls = pi[b, a, gj, gi].split((2, 2, 1, self.nc), 1) |
|
|
|
|
|
pxy = pxy.sigmoid() * 2 - 0.5 |
|
pwh = (pwh.sigmoid() * 2) ** 2 * anchors[i] |
|
pbox = torch.cat((pxy, pwh), 1) |
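                # CIoU regression: penalizes overlap, center distance, and aspect ratio.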
|
iou = bbox_iou(pbox, tbox[i], CIoU=True).squeeze() |
|
lbox += (1.0 - iou).mean() |
|
|
|
|
|
iou = iou.detach().clamp(0).type(tobj.dtype) |
|
if self.sort_obj_iou: |
|
j = iou.argsort() |
|
b, a, gj, gi, iou = b[j], a[j], gj[j], gi[j], iou[j] |
|
if self.gr < 1: |
|
iou = (1.0 - self.gr) + self.gr * iou |
|
tobj[b, a, gj, gi] = iou |
|
|
|
|
|
if self.nc > 1: |
|
t = torch.full_like(pcls, self.cn, device=self.device) |
|
t[range(n), tcls[i]] = self.cp |
|
                    # The mask argument is unused when object_loss=False; pcls is a placeholder.
                    lcls += self.BCEcls(pcls, t, pcls, object_loss=False, patch=False)

            # Objectness focal loss restricted to the patch mask; patch=True averages
            # over the masked cells rather than the full map.
            obji = self.BCEobj(pi[..., 4], tobj, pq[..., 4], object_loss=True, patch=True)
|
lobj += obji * self.balance[i] |
|
if self.autobalance: |
|
self.balance[i] = self.balance[i] * 0.9999 + 0.0001 / obji.detach().item() |
|
|
|
|
|
if self.autobalance: |
|
self.balance = [x / self.balance[self.ssi] for x in self.balance] |
|
lbox *= self.hyp["box"] |
|
lobj *= self.hyp["obj"] |
|
lcls *= self.hyp["cls"] |
|
        bs = tobj.shape[0]

        return lbox, lobj, lcls, bs, t_classes_path, p_classes_path
|
|
|
    def loss_com_background(self, tcls, tbox, indices, anchors, p):
        """Computes box, objectness, and class losses for pseudo-labelled targets over the full prediction maps."""
        lcls = torch.zeros(1, device=self.device)
        lbox = torch.zeros(1, device=self.device)
        lobj = torch.zeros(1, device=self.device)
        p_classes_all = []
|
for i, pi in enumerate(p): |
|
b, a, gj, gi = indices[i] |
|
tobj = torch.zeros(pi.shape[:4], dtype=pi.dtype, device=self.device) |
|
|
|
n = b.shape[0] |
|
if n: |
|
|
|
                pxy, pwh, pobj, pcls = pi[b, a, gj, gi].split((2, 2, 1, self.nc), 1)
|
|
|
|
|
pxy = pxy.sigmoid() * 2 - 0.5 |
|
pwh = (pwh.sigmoid() * 2) ** 2 * anchors[i] |
|
pbox = torch.cat((pxy, pwh), 1) |
|
iou = bbox_iou(pbox, tbox[i], CIoU=True).squeeze() |
|
lbox += (1.0 - iou).mean() |
|
|
|
|
|
iou = iou.detach().clamp(0).type(tobj.dtype) |
|
if self.sort_obj_iou: |
|
j = iou.argsort() |
|
b, a, gj, gi, iou = b[j], a[j], gj[j], gi[j], iou[j] |
|
if self.gr < 1: |
|
iou = (1.0 - self.gr) + self.gr * iou |
|
tobj[b, a, gj, gi] = iou |
|
|
|
|
|
if self.nc > 1: |
|
t = torch.full_like(pcls, self.cn, device=self.device) |
|
t[range(n), tcls[i]] = self.cp |
|
                    lcls += self.BCEcls(pcls, t, pcls, object_loss=False, patch=False)
                    p_classes_all.append(pcls)

            # Supervise objectness only at matched cells: both prediction and target
            # are zero everywhere else.
            mask = torch.zeros_like(pi[..., 4], dtype=torch.bool)
            mask[b, a, gj, gi] = True

            masked_values = torch.zeros(pi.shape[:4], dtype=pi.dtype, device=self.device)
            masked_values[mask] = pi[..., 4][mask]

            obji = self.BCEobj(masked_values, tobj, mask, object_loss=True, patch=False)
|
|
|
lobj += obji * self.balance[i] |
|
if self.autobalance: |
|
self.balance[i] = self.balance[i] * 0.9999 + 0.0001 / obji.detach().item() |
|
|
|
        if self.autobalance:
            self.balance = [x / self.balance[self.ssi] for x in self.balance]

        bs = tobj.shape[0]

        # Guard against the (rare) case where no pseudo-target matched any anchor.
        p_classes_all = torch.cat(p_classes_all, dim=0) if p_classes_all else torch.empty(0, self.nc, device=self.device)

        return lbox, lobj, lcls, p_classes_all
|
|
|
    def loss_com_image(self, tcls, tbox, indices, anchors, p):
        """Collects class predictions at matched target locations across all levels."""
        image_classes_all = []

        for i, pi in enumerate(p):
            b, a, gj, gi = indices[i]

            n = b.shape[0]
            if n:
                pxy, pwh, pobj, pcls = pi[b, a, gj, gi].split((2, 2, 1, self.nc), 1)
                image_classes_all.append(pcls)
        image_classes_all = torch.cat(image_classes_all)

        return image_classes_all
|
|
|
|
|
|
|
def build_targets(self, p, target): |
|
"""Prepares model targets from input targets (image,class,x,y,w,h) for loss computation, returning class, box, |
|
indices, and anchors. |
|
|
|
""" |
|
|
|
        targets = target[:, :6]  # keep (image, class, x, y, w, h); drop the patch-region columns
|
|
|
na, nt = self.na, targets.shape[0] |
|
tcls, tbox, indices, anch = [], [], [], [] |
|
gain = torch.ones(7, device=self.device) |
|
ai = torch.arange(na, device=self.device).float().view(na, 1).repeat(1, nt) |
|
targets = torch.cat((targets.repeat(na, 1, 1), ai[..., None]), 2) |
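        # targets is now shape (na, nt, 7): (image, class, x, y, w, h, anchor index).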
|
|
|
g = 0.5 |
|
        off = (
            torch.tensor(
                [
                    [0, 0],
                    [1, 0],
                    [0, 1],
                    [-1, 0],
                    [0, -1],  # j, k, l, m
                ],
                device=self.device,
            ).float()
            * g
        )
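        # The offsets select up to two neighbouring grid cells per target (besides its
        # own cell), tripling the number of positive samples as in YOLOv5.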
|
|
|
for i in range(self.nl): |
|
anchors, shape = self.anchors[i], p[i].shape |
|
gain[2:6] = torch.tensor(shape)[[3, 2, 3, 2]] |
|
|
|
|
|
            t = targets * gain  # scale normalized targets to grid units
|
if nt: |
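                # Match targets to anchors by width/height ratio; keep pairs whose
                # ratio is within hyp["anchor_t"].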
|
|
|
r = t[..., 4:6] / anchors[:, None] |
|
j = torch.max(r, 1 / r).max(2)[0] < self.hyp["anchor_t"] |
|
|
|
t = t[j] |
|
|
|
|
|
gxy = t[:, 2:4] |
|
gxi = gain[[2, 3]] - gxy |
|
j, k = ((gxy % 1 < g) & (gxy > 1)).T |
|
l, m = ((gxi % 1 < g) & (gxi > 1)).T |
|
j = torch.stack((torch.ones_like(j), j, k, l, m)) |
|
t = t.repeat((5, 1, 1))[j] |
|
offsets = (torch.zeros_like(gxy)[None] + off[:, None])[j] |
|
else: |
|
t = targets[0] |
|
offsets = 0 |
|
|
|
|
|
bc, gxy, gwh, a = t.chunk(4, 1) |
|
a, (b, c) = a.long().view(-1), bc.long().T |
|
gij = (gxy - offsets).long() |
|
gi, gj = gij.T |
|
|
|
|
|
indices.append((b, a, gj.clamp_(0, shape[2] - 1), gi.clamp_(0, shape[3] - 1))) |
|
tbox.append(torch.cat((gxy - gij, gwh), 1)) |
|
anch.append(anchors[a]) |
|
tcls.append(c) |
|
|
|
return tcls, tbox, indices, anch |
|
|
|
|
|
|
|
|
|
|
|
    def compute_kl_loss(self, tcls, pred):
        """KL divergence between the empirical target class distribution and the
        Gumbel-softmax prediction distribution.
        """
        data2 = self.gumbel_softmax(pred, tau=1, hard=False)

        data1 = [torch.tensor(lst) for lst in tcls]
        stacked_data1 = torch.stack(data1)

        # Per-class counts: targets are detached, predictions keep their gradients.
        data1_counts = torch.sum(stacked_data1, dim=0).detach()
        data2_counts = torch.sum(data2, dim=0)

        epsilon = 1e-12
        data1_probs = (data1_counts + epsilon) / data1_counts.sum()
        data2_probs = (data2_counts + epsilon) / data2_counts.sum()

        data1_probs = data1_probs.to(self.device, dtype=torch.float).requires_grad_(True)

        kl_div = F.kl_div(data1_probs.log(), data2_probs, reduction="batchmean")
        return kl_div
|
    def gumbel_softmax(self, logits, tau=1, hard=False, eps=1e-10):
        """Differentiable sampling from a categorical distribution (Gumbel-softmax)."""
        gumbels = -torch.empty_like(logits).exponential_().log()  # ~ Gumbel(0, 1)
        gumbels = (logits + gumbels) / tau
        y_soft = gumbels.softmax(dim=-1)

        if hard:
            # Straight-through: hard one-hot forward pass, soft gradients backward.
            index = y_soft.max(dim=-1, keepdim=True)[1]
            y_hard = torch.zeros_like(logits).scatter_(-1, index, 1.0)
            ret = y_hard - y_soft.detach() + y_soft
        else:
            ret = y_soft
        return ret
|
|
|
def make_grid(self, nx=20, ny=20, i=0): |
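        """Builds the (x, y) cell-offset grid and the per-anchor size grid for level i."""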
|
d = self.anchors[i].device |
|
t = self.anchors[i].dtype |
|
shape = 1, self.na, ny, nx, 2 |
|
y, x = torch.arange(ny, device=d, dtype=t), torch.arange(nx, device=d, dtype=t) |
|
yv, xv = torch.meshgrid(y, x, indexing='ij') |
|
grid = torch.stack((xv, yv), 2).expand(shape) - 0.5 |
|
anchor_grid = (self.anchors[i] * self.stride[i]).view((1, self.na, 1, 1, 2)).expand(shape) |
|
return grid, anchor_grid |
|
    def calculate_overlap(self, box1, box2):
        """Calculate the overlap area (in pixels) between two normalized xywh boxes."""

        # Boxes are normalized; scale by the assumed 640 px training resolution.
        box1 = box1 * 640
        box2 = box2 * 640
|
x_left = torch.max(box1[0] - box1[2] / 2, box2[0] - box2[2] / 2) |
|
y_top = torch.max(box1[1] - box1[3] / 2, box2[1] - box2[3] / 2) |
|
x_right = torch.min(box1[0] + box1[2] / 2, box2[0] + box2[2] / 2) |
|
y_bottom = torch.min(box1[1] + box1[3] / 2, box2[1] + box2[3] / 2) |
|
|
|
|
|
width = torch.clamp(x_right - x_left, min=0) |
|
height = torch.clamp(y_bottom - y_top, min=0) |
|
|
|
|
|
intersection_area = width * height |
|
return intersection_area |
|
    def merge_tensors(self, tensor1, tensor_9):
        """Splits candidate boxes (tensor_9) into those overlapping tensor1 boxes (patch) and the rest."""
        without_patch_tensor = []
        patch_tensor = []
        tensor2 = tensor_9[:, :6]

        for box2 in tensor2:
            overlap = False

            for box1 in tensor1:
                if box1[0] == box2[0]:  # same image index
                    if self.calculate_overlap(box1[2:], box2[2:]) > 100:
                        overlap = True
                        break

            if overlap:
                patch_tensor.append(box2)
            else:
                without_patch_tensor.append(box2)
        if without_patch_tensor:
            without_patch_tensor = torch.stack(without_patch_tensor)
            without_patch_tensor = without_patch_tensor[without_patch_tensor[:, 0].argsort()]

        return without_patch_tensor, patch_tensor
|
|
|
|
|
|
|
|
|
|
|
    def pseudo_targets(self, p, target):
        """Decodes raw predictions, runs NMS, and splits confident detections into
        pseudo-targets (conf > 0.95 with low class entropy) and medium-confidence
        targets (0.60 < conf <= 0.95); both are then filtered against ground truth.
        """
|
        z = []

        p_clone = p.copy()
        for i in range(self.nl):
            bs, self.na, ny, nx, self.no = p_clone[i].shape

            # Decode xywh and confidence exactly as the Detect head does at inference.
            xy, wh, conf = p_clone[i].sigmoid().split((2, 2, self.nc + 1), 4)
            self.grid[i], self.anchor_grid[i] = self.make_grid(nx, ny, i)
            xy = (xy * 2 + self.grid[i]) * self.stride[i]
            wh = (wh * 2) ** 2 * self.anchor_grid[i]
            y = torch.cat((xy, wh, conf), 4)
            z.append(y.view(bs, self.na * nx * ny, self.no))

        z_new = torch.cat(z, 1)
|
|
|
        lb = []  # autolabelling is disabled; no per-image label priors are passed to NMS

        # Class-agnostic NMS on detached CPU predictions: conf_thres=0.5, iou_thres=0.2.
|
train_preds = non_max_suppression_ps( |
|
z_new.detach().cpu(), 0.5, 0.2, labels=lb, multi_label=False, agnostic=True, max_det=300 |
|
) |
|
|
|
|
|
|
|
|
|
train_pseudo_labels = [torch.tensor([]) for _ in range(len(train_preds))] |
|
train_pseudo_labels_60_90 = [torch.tensor([]) for _ in range(len(train_preds))] |
|
|
|
        for num, preds in enumerate(train_preds):
            for bbox in preds:
                # Ignore tiny boxes (area of at most 10 px^2).
                if ((bbox[2] - bbox[0]) * (bbox[3] - bbox[1])) > 10:
                    if bbox[4] > 0.95:
                        # Class scores are the last 14 values (assumes nc == 14).
                        last_14_values = bbox[-14:].softmax(dim=0)
                        probs = last_14_values / last_14_values.sum()
                        dist = torch.distributions.Categorical(probs)
                        entropy = dist.entropy()

                        # Keep only detections whose class distribution has low entropy.
                        if entropy.item() < 2.7:
                            bbox_tensor = bbox.clone().detach().unsqueeze(0)
                            train_pseudo_labels[num] = torch.cat((train_pseudo_labels[num], bbox_tensor), dim=0)

                    elif 0.60 < bbox[4] <= 0.95:
                        bbox_tensor = bbox.clone().detach().unsqueeze(0)
                        train_pseudo_labels_60_90[num] = torch.cat((train_pseudo_labels_60_90[num], bbox_tensor), dim=0)
|
        train_pseudo_box = [[] for _ in range(len(train_pseudo_labels))]
        train_pseudo_box_60_90 = [[] for _ in range(len(train_pseudo_labels_60_90))]

        for num2, pred_box in enumerate(train_pseudo_labels):
            for bbox in pred_box:
                train_pseudo_box[num2].append(bbox.detach().cpu().numpy())
        for num2, pred_box in enumerate(train_pseudo_labels_60_90):
            for bbox in pred_box:
                train_pseudo_box_60_90[num2].append(bbox.detach().cpu().numpy())
|
|
|
|
|
        pseudo_target_list = []
        pseudo_target_list_60_90 = []

        # Re-pack each detection as (image index, class, x1, y1, x2, y2).
        for i, tensor in enumerate(train_pseudo_labels):
            for t in tensor:
                pseudo_target_list.append([i, t[5].item(), int(t[0]), int(t[1]), int(t[2]), int(t[3])])

        for i, tensor in enumerate(train_pseudo_labels_60_90):
            for t in tensor:
                pseudo_target_list_60_90.append([i, t[5].item(), int(t[0]), int(t[1]), int(t[2]), int(t[3])])

        pseudo_target_list = [torch.tensor(v, dtype=torch.float) for v in pseudo_target_list]
        pseudo_target_list_60_90 = [torch.tensor(v, dtype=torch.float) for v in pseudo_target_list_60_90]
|
        targets_ps = target[:, :6]

        wp_target = []
        p_target = []
        wp_target_60_90 = []
|
|
|
        if pseudo_target_list:
            pseudo_target_list_concatenated = torch.stack(pseudo_target_list, dim=0)

            # Normalize pixel xyxy coordinates by the assumed 640 px image size.
            pseudo_target_list_concatenated = pseudo_target_list_concatenated / torch.tensor([1, 1, 640, 640, 640, 640])

            # Convert corner (xyxy) to center (xywh) format.
            x_min, y_min, x_max, y_max = (
                pseudo_target_list_concatenated[:, 2],
                pseudo_target_list_concatenated[:, 3],
                pseudo_target_list_concatenated[:, 4],
                pseudo_target_list_concatenated[:, 5],
            )
            x_center = (x_min + x_max) / 2
            y_center = (y_min + y_max) / 2
            width = x_max - x_min
            height = y_max - y_min

            pseudo_target_list_concatenated[:, 2] = x_center
            pseudo_target_list_concatenated[:, 3] = y_center
            pseudo_target_list_concatenated[:, 4] = width
            pseudo_target_list_concatenated[:, 5] = height

            pseudo_target_list_concatenated = pseudo_target_list_concatenated.to(target.device)
            wp_target, p_target = self.merge_tensors(targets_ps, pseudo_target_list_concatenated)
|
        if pseudo_target_list_60_90:
            pseudo_target_list_concatenated_60_90 = torch.stack(pseudo_target_list_60_90, dim=0)
            pseudo_target_list_concatenated_60_90 = pseudo_target_list_concatenated_60_90 / torch.tensor([1, 1, 640, 640, 640, 640])

            # Same corner-to-center conversion as above.
            x_min, y_min, x_max, y_max = (
                pseudo_target_list_concatenated_60_90[:, 2],
                pseudo_target_list_concatenated_60_90[:, 3],
                pseudo_target_list_concatenated_60_90[:, 4],
                pseudo_target_list_concatenated_60_90[:, 5],
            )
            x_center = (x_min + x_max) / 2
            y_center = (y_min + y_max) / 2
            width = x_max - x_min
            height = y_max - y_min

            pseudo_target_list_concatenated_60_90[:, 2] = x_center
            pseudo_target_list_concatenated_60_90[:, 3] = y_center
            pseudo_target_list_concatenated_60_90[:, 4] = width
            pseudo_target_list_concatenated_60_90[:, 5] = height

            pseudo_target_list_concatenated_60_90 = pseudo_target_list_concatenated_60_90.to(target.device)
            wp_target_60_90, p_target_60_90 = self.merge_tensors(targets_ps, pseudo_target_list_concatenated_60_90)
|
|
|
|
|
        return wp_target, p_target, targets_ps, wp_target_60_90
|
    def calculate_iou(self, bbox1, bbox2):
|
""" |
|
Calculate Intersection over Union (IoU) between two bounding boxes. |
|
|
|
Arguments: |
|
bbox1 (tuple): Coordinates of the first bounding box in the format (x1, y1, x2, y2). |
|
bbox2 (tuple): Coordinates of the second bounding box in the format (x1, y1, x2, y2). |
|
|
|
Returns: |
|
float: Intersection over Union (IoU) between the two bounding boxes. |
|
""" |
|
|
|
x1_1, y1_1, x2_1, y2_1 = bbox1 |
|
x1_2, y1_2, x2_2, y2_2 = bbox2 |
|
|
|
|
|
x_left = max(x1_1, x1_2) |
|
y_top = max(y1_1, y1_2) |
|
x_right = min(x2_1, x2_2) |
|
y_bottom = min(y2_1, y2_2) |
|
|
|
|
|
if x_right < x_left or y_bottom < y_top: |
|
return 0.0 |
|
|
|
|
|
intersection_area = (x_right - x_left) * (y_bottom - y_top) |
|
|
|
|
|
bbox1_area = (x2_1 - x1_1) * (y2_1 - y1_1) |
|
bbox2_area = (x2_2 - x1_2) * (y2_2 - y1_2) |
|
|
|
|
|
union_area = bbox1_area + bbox2_area - intersection_area |
|
|
|
|
|
iou = intersection_area / union_area |
|
|
|
return iou |
|
    def xywh_to_xyxy(self, xywh):
        """Converts a center-format (x, y, w, h) box to corner format (x1, y1, x2, y2)."""
|
x_center, y_center, width, height = xywh |
|
x_min = x_center - width / 2 |
|
y_min = y_center - height / 2 |
|
x_max = x_center + width / 2 |
|
y_max = y_center + height / 2 |
|
return torch.tensor([x_min, y_min, x_max, y_max]) |
|
    def compute_similarity(self, feature_maps):
        """Pairwise cosine-similarity matrix between globally pooled feature maps."""
|
num_samples = len(feature_maps) |
|
similarity_matrix = torch.zeros((num_samples, num_samples)) |
|
|
|
|
|
pooled_feature_maps = [F.avg_pool2d(fm, fm.shape[2]) for fm in feature_maps] |
|
|
|
for i in range(num_samples): |
|
for j in range(num_samples): |
|
|
|
similarity_matrix[i, j] = F.cosine_similarity(pooled_feature_maps[i].view(-1), pooled_feature_maps[j].view(-1), dim=0) |
|
|
|
return similarity_matrix |
|
|
|
|
|
    def feat_box(self, pseudo_targets, int_feat, Num_targets, p_layer):
        """Extracts ROI-aligned (4x4) feature crops for each target box from feature level p_layer."""
        pooled_feature_map_pseudo = []
        is_bbox = []
|
for i in range(Num_targets): |
|
img_num = int(pseudo_targets[i,0].item()) |
|
|
|
            p2_feature_map = int_feat[p_layer][img_num]
|
|
|
x_center = pseudo_targets[i, 2] |
|
y_center = pseudo_targets[i, 3] |
|
width = pseudo_targets[i, 4] |
|
height = pseudo_targets[i, 5] |
|
            bb = [round(x_center.item(), 4), round(y_center.item(), 4), round(width.item(), 4), round(height.item(), 4)]

            p2_feature_shape_tensor = torch.tensor(
                [p2_feature_map.shape[2], p2_feature_map.shape[1], p2_feature_map.shape[2], p2_feature_map.shape[1]]
            )
|
|
|
p2_normalized_xyxy = self.xywh_to_xyxy(bb)*p2_feature_shape_tensor |
|
|
|
p2_x_min, p2_y_min, p2_x_max, p2_y_max = get_fixed_xyxy(p2_normalized_xyxy,p2_feature_map) |
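            # roi_align expects boxes as (batch_index, x1, y1, x2, y2); the batch index
            # is always 0 here because a single feature map is passed per call.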
|
|
|
batch_index = torch.tensor([0], dtype=torch.float32).to(self.device) |
|
|
|
p2_roi = torch.tensor([p2_x_min, p2_y_min, p2_x_max, p2_y_max], device=self.device).float() |
|
is_bbox.append(p2_roi) |
|
|
|
p2_roi_with_batch_index = torch.cat([batch_index, p2_roi]) |
|
|
|
|
|
|
|
p2_resized_object = torchvision.ops.roi_align(p2_feature_map.unsqueeze(0), p2_roi_with_batch_index.unsqueeze(0).to(self.device), output_size=(4, 4)) |
|
pooled_feature_map_pseudo.append(p2_resized_object) |
|
return pooled_feature_map_pseudo, is_bbox |
|
    def similarity(self, int_feat, pseudo_targets, patch_targets, original_targets, p_layer):
        """Contrastive feature loss: pseudo-box features should be closer to same-class
        ground-truth features than to different-class ones, by a small margin.
        """
        losses = []
        Num_targets = len(pseudo_targets)
        Num_targets_label = len(original_targets)
        target_features, target_box = self.feat_box(original_targets, int_feat, Num_targets_label, p_layer)
|
        if Num_targets:
            pseudo_features, pseudo_box = self.feat_box(pseudo_targets, int_feat, Num_targets, p_layer)

            for feat2, label2, is_bb in zip(pseudo_features, pseudo_targets[:, 1], pseudo_box):
                # Track the hardest positive (least-similar same-class feature) and the
                # hardest negative (most-similar different-class feature).
                min_same_class_sim = 100
                max_diff_class_sim = 0
                feat2 = F.avg_pool2d(feat2, feat2.shape[2])
                for feat1, label1, ps_bb in zip(target_features, original_targets[:, 1], target_box):
                    iou = self.calculate_iou(ps_bb, is_bb)
                    feat1 = F.avg_pool2d(feat1, feat1.shape[2])

                    # Only compare spatially disjoint boxes.
                    if iou < 0.3:
                        similarity = cosine_similarity(feat1, feat2).mean()
                        similarity = similarity + 1  # shift from [-1, 1] to [0, 2]

                        if label1 == label2:
                            if min_same_class_sim > similarity:
                                min_same_class_sim = similarity
                        else:
                            if max_diff_class_sim < similarity:
                                max_diff_class_sim = similarity

                if min_same_class_sim < 100 and max_diff_class_sim > 0:
                    # Hinge on the 0.05 margin; clamp keeps everything on one device.
                    loss_value = torch.clamp(min_same_class_sim - (max_diff_class_sim + 0.05), min=0.0)
                    losses.append(loss_value)
|
        if losses:
            total_loss = torch.sum(torch.stack(losses)) / len(losses)
        else:
            total_loss = torch.zeros(1, device=self.device)
        return total_loss