Spaces:

Pranjal2041
/

DenseBreastCancerDetection

Sleeping

App Files Files Community

DenseBreastCancerDetection / DenseMammogram /auc_by_pranjal.py

Pranjal2041

Initial demo

970a7a2 over 1 year ago

raw

history blame contribute delete

4.16 kB

	import os
	from os.path import join
	import glob
	from sklearn.metrics import roc_auc_score, roc_curve
	import sys

	def file_to_score(file):
	try:
	content = open(file, 'r').readlines()
	st = 0
	if len(content) == 0:
	# Empty File Should Return []
	return 0.
	if content[0].split()[0].isalpha():
	st = 1
	return max([float(line.split()[st]) for line in content])
	except FileNotFoundError:
	print(f'No Corresponding Box Found for file {file}, using [] as preds')
	return []
	except Exception as e:
	print('Some Error',e)
	return []

	# Create the image dict
	def generate_image_dict(preds_folder_name='preds_42',
	root_fol='/home/krithika_1/densebreeast_datasets/AIIMS_C1',
	mal_path=None, ben_path=None, gt_path=None,
	mal_img_path = None, ben_img_path = None
	):

	mal_path = join(root_fol, mal_path) if mal_path else join(
	root_fol, 'mal', preds_folder_name)
	ben_path = join(root_fol, ben_path) if ben_path else join(
	root_fol, 'ben', preds_folder_name)
	mal_img_path = join(root_fol, mal_img_path) if mal_img_path else join(
	root_fol, 'mal', 'images')
	ben_img_path = join(root_fol, ben_img_path) if ben_img_path else join(
	root_fol, 'ben', 'images')
	gt_path = join(root_fol, gt_path) if gt_path else join(
	root_fol, 'mal', 'gt')


	'''
	image_dict structure:
	'image_name(without txt/png)' : {'gt' : [[...]], 'preds' : score}
	'''
	image_dict = dict()

	# GT Might be sightly different from images, therefore we will index gts based on
	# the images folder instead.
	for file in os.listdir(mal_img_path):
	# for file in glob.glob(join(gt_path, '*.txt')):
	if not file.endswith('.png'):
	continue
	file = file[:-4] + '.txt'
	file = join(gt_path, file)
	key = os.path.split(file)[-1][:-4]
	image_dict[key] = dict()
	image_dict[key]['gt'] = 1.
	image_dict[key]['preds'] = 0.

	for file in glob.glob(join(mal_path, '*.txt')):
	key = os.path.split(file)[-1][:-4]
	assert key in image_dict
	image_dict[key]['preds'] = file_to_score(file)

	for file in os.listdir(ben_img_path):
	# for file in glob.glob(join(ben_path, '*.txt')):
	if not file.endswith('.png'):
	continue

	file = file[:-4] + '.txt'
	file = join(ben_path, file)
	key = os.path.split(file)[-1][:-4]
	# if key == 'Calc-Test_P_00353_LEFT_CC' or key == 'Calc-Training_P_00600_LEFT_CC':
	# continue
	if key in image_dict:
	print(key)
	print('SHIT')
	continue
	# assert key not in image_dict
	image_dict[key] = dict()
	image_dict[key]['preds'] = file_to_score(file)
	image_dict[key]['gt'] = 0.
	return image_dict

	def get_auc_score_from_imdict(image_dict):
	keys = list(image_dict.keys())
	y = [image_dict[k]['gt']for k in keys]
	preds = [image_dict[k]['preds']for k in keys]
	return roc_auc_score(y, preds)

	def get_accuracy_from_imdict(image_dict, thresh = 0.3):
	keys = list(image_dict.keys())
	ys = [image_dict[k]['gt']for k in keys]
	preds = [image_dict[k]['preds']for k in keys]
	acc = 0
	for y,pred in zip(ys,preds):
	if pred < thresh and y == 0.:
	acc+=1
	elif pred > thresh and y == 1.:
	acc+=1
	return acc/len(preds)


	def get_auc_score(preds_image_folder, root_fol, retAcc = False, acc_thresh = 0.3):
	im_dict = generate_image_dict(preds_image_folder, root_fol = root_fol)
	if retAcc:
	return get_auc_score_from_imdict(im_dict), get_accuracy_from_imdict(im_dict, acc_thresh)
	else:
	return get_auc_score_from_imdict(im_dict)

	if __name__ == '__main__':
	seed = '42' if len(sys.argv)== 1 else sys.argv[1]

	root_fol = '../bilateral_new/MammoDatasets/AIIMS_highres_reliable/test'

	auc_score = get_auc_score(f'preds_{seed}',root_fol)
	print(f'ROC AUC Score: {auc_score}')