@misc{pokhrel2024ncddnearestcentroiddistance,
title={NCDD: Nearest Centroid Distance Deficit for Out-Of-Distribution Detection in
Gastrointestinal Vision},
author={Sandesh Pokhrel and Sanjay Bhandari and Sharib Ali and Tryphon Lambrou and Anh
Nguyen and Yash Raj Shrestha and Angus Watson and Danail Stoyanov and Prashnna Gyawali
and Binod Bhattarai},
year={2024},
eprint={2412.01590},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/2412.01590},
}
@misc{khanal2025hallucinationawaremultimodalbenchmarkgastrointestinal,
title={Hallucination-Aware Multimodal Benchmark for Gastrointestinal Image Analysis with Large Vision-Language Models},
author={Bidur Khanal and Sandesh Pokhrel and Sanjay Bhandari and Ramesh Rana and Nikesh Shrestha and Ram Bahadur Gurung and Cristian Linte and Angus Watson and Yash Raj Shrestha and Binod Bhattarai},
year={2025},
eprint={2505.07001},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/2505.07001},
}
To facilitate VLM research on gastrointestinal (GI) image analysis and study hallucination, we curate a multimodal image-text GI dataset: Gut-VLM. This dataset is created using a two-stage pipeline: first, descriptive medical reports of Kvasir-v2 images are generated using ChatGPT, which introduces some hallucinated or incorrect texts. In the second stage, medical experts systematically review these reports, and identify and correct potential inaccuracies to ensure high-quality, clinically reliable annotations.
Unlike traditional datasets that contain only descriptive texts, our dataset also features tags identifying hallucinated sentences and their corresponding corrections. A common approach to reducing hallucination in VLM is to finetune the model on a small-scale, problem-specific dataset. However, we take a different strategy using our dataset. Instead of finetuning the VLM solely for generating textual reports, we finetune it to detect and correct hallucinations, an approach we call hallucination-aware finetuning. Our results show that this approach is better than simply finetuning for descriptive report generation. Additionally, we conduct an extensive evaluation of state-of-the-art VLMs across several metrics, establishing a benchmark.
https://github.com/bhattarailab/Hallucination-Aware-VLM
@misc{}
Multimodal Federated Learning With Missing Modalities through Feature Imputation Network
@misc{poudel2025multimodalfederatedlearningmissing,
title={Multimodal Federated Learning With Missing Modalities through Feature Imputation Network},
author={Pranav Poudel and Aavash Chhetri and Prashnna Gyawali and Georgios Leontidis and Binod Bhattarai},
year={2025},
eprint={2505.20232},
archivePrefix={arXiv},
primaryClass={cs.LG},
url={https://arxiv.org/abs/2505.20232},
}
https://github.com/bhattarailab/FedFeatGen
NERO: Explainable Out-of-Distribution Detection with Neuron-level Relevance
@misc{chhetri2025neroexplainableoutofdistributiondetection,
title={NERO: Explainable Out-of-Distribution Detection with Neuron-level Relevance},
author={Anju Chhetri and Jari Korhonen and Prashnna Gyawali and Binod Bhattarai},
year={2025},
eprint={2506.15404},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/2506.15404},
}
@article{brainsci15050481,
title={Assistive Artificial Intelligence in Epilepsy and Its Impact on Epilepsy Care in
Low- and Middle-Income Countries},
author={Koirala, Nabin and Adhikari, Shishir Raj and Adhikari, Mukesh and Yadav, Taruna
and Anwar, Abdul Rauf and Ciolac, Dumitru and Shrestha, Bibhusan and Adhikari, Ishan and
Khanal, Bishesh and Muthuraman, Muthuraman},
year={2025},
journal={Brain Sciences},
doi = {10.3390/brainsci15050481},
url={https://www.mdpi.com/2076-3425/15/5/481},
}
Multimodal Lead-Specific Modeling of ECG for Low-Cost Pulmonary Hypertension Assessment
@misc{suvon2025multimodalleadspecificmodelingecg,
title={Multimodal Lead-Specific Modeling of ECG for Low-Cost Pulmonary Hypertension Assessment},
author={Mohammod N. I. Suvon and Shuo Zhou and Prasun C. Tripathi and Wenrui Fan and Samer Alabed and Bishesh Khanal and Venet Osmani and Andrew J. Swift and Chen and Chen and Haiping Lu},
year={2025},
eprint={2503.13470},
archivePrefix={arXiv},
primaryClass={eess.SP},
url={https://arxiv.org/abs/2503.13470},
}
Dimension Mixer: Group Mixing of Input Dimensions for Efficient Function Approximation
@misc{sapkota2024dimensionmixergroupmixing,
title={Dimension Mixer: Group Mixing of Input Dimensions for Efficient Function Approximation},
author={Suman Sapkota and Binod Bhattarai},
year={2024},
eprint={2311.18735},
archivePrefix={arXiv},
primaryClass={cs.LG},
url={https://arxiv.org/abs/2311.18735},
}
@misc{guragain2024nlpineersnludevanagariscript,
title={NLPineers@ NLU of Devanagari Script Languages 2025: Hate Speech Detection using Ensembling of BERT-based models},
author={Anmol Guragain and Nadika Poudel and Rajesh Piryani and Bishesh Khanal},
year={2024},
eprint={2412.08163},
archivePrefix={arXiv},
primaryClass={cs.CL},
url={https://arxiv.org/abs/2412.08163},
}
https://github.com/Anmol2059/NLPineers
Exploring transfer learning in medical image segmentation using vision-language models
@article{poudel2023exploring,
title={Exploring transfer learning in medical image segmentation using vision-language models},
author={Poudel, Kanchan and Dhakal, Manish and Bhandari, Prasiddha and Adhikari, Rabin and Thapaliya, Safal and Khanal, Bishesh},
journal={arXiv preprint arXiv:2308.07706},
year={2023}
}
Although transfer learning from natural to medical images has been explored for image only segmentation models, the joint representation of vision-language in segmentation problems remains underexplored. This study introduces the first systematic study on transferring VLSMs to 2D medical images, using carefully curated 11 datasets encompassing diverse modalities and insightful language prompts and experiments. Our findings demon strate that although VLSMs show competitive performance compared to image-only models for segmentation after finetuning in limited medical image datasets, not all VLSMs utilize the additional information from language prompts, with image features playing a dominant role. While VLSMs exhibit enhanced performance in handling pooled datasets with diverse modalities and show potential robustness to domain shifts compared to conventional seg mentation models, our results suggest that novel approaches are required to enable VLSMs to leverage the various auxiliary information available through language prompts. The code and datasets are available at:
https://github.com/naamiinepal/medvlsm.
TuneVLSeg: Prompt Tuning Benchmark for Vision-Language Segmentation Models
@article{adhikari2024tunevlsegprompttuningbenchmark,
title={TuneVLSeg: Prompt Tuning Benchmark for Vision-Language Segmentation Models},
author={Rabin Adhikari and Safal Thapaliya and Manish Dhakal and Bishesh Khanal},
year={2024},
eprint={2410.05239},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/2410.05239},
}
https://github.com/naamiinepal/tunevlseg
@article{nakarmi2023deep,
title={Deep-learning assisted detection and quantification of (oo) cysts of Giardia and Cryptosporidium on smartphone microscopy images},
author={Nakarmi, Suprim and Pudasaini, Sanam and Thapaliya, Safal and Upretee, Pratima and Shrestha, Retina and Giri, Basant and Neupane, Bhanu Bhakta and Khanal, Bishesh},
journal={arXiv preprint arXiv:2304.05339},
year={2023}
}
T2FNorm: Train-time Feature Normalization for OOD Detection in Image Classification
@inproceedings{regmi2024t2fnorm,
title={T2FNorm: Train-time Feature Normalization for OOD Detection in Image Classification},
author={Regmi, Sudarshan and Panthi, Bibek and Dotel, Sakar and Gyawali, Prashnna K and Stoyanov, Danail and Bhattarai, Binod},
booktitle={Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
pages={153--162},
year={2024}
}
Task-Aware Active Learning for Endoscopic Polyp Segmentation
@article{amgain2024investigationfederatedlearningalgorithms,
title={Investigation of Federated Learning Algorithms for Retinal Optical Coherence Tomography Image Classification with Statistical Heterogeneity},
author={Sanskar Amgain and Prashant Shrestha and Sophia Bano and Ignacio del Valle Torres and Michael Cunniffe and Victor Hernandez and Phil Beales and Binod Bhattarai},
year={2024},
eprint={2402.10035},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/2402.10035},
}
Methods: We investigate the effectiveness of FedAvg and FedProx to train an OCT image classification model in a decentralized fashion, addressing privacy concerns associated with centralizing data. We partitioned a publicly available OCT dataset across multiple clients under IID and Non-IID settings and conducted local training on the subsets for each client. We evaluated two federated learning methods, FedAvg and FedProx for these settings.
Results: Our experiments on the dataset suggest that under IID settings, both methods perform on par with training on a central data pool. However, the performance of both algorithms declines as we increase the statistical heterogeneity across the client data, while FedProx consistently performs better than FedAvg in the increased heterogeneity settings.
Conclusion: Despite the effectiveness of federated learning in the utilization of private data across multiple medical institutions, the large number of clients and heterogeneous distribution of labels deteriorate the performance of both algorithms. Notably, FedProx appears to be more robust to the increased heterogeneity.
iHuman: Instant Animatable Digital Humans From Monocular Videos
@article{paudel2024ihuman,
title={iHuman: Instant Animatable Digital Humans From Monocular Videos},
author={Paudel, Pramish and Khanal, Anubhav and Chhatkuli, Ajad and Paudel, Danda Pani and Tandukar, Jyoti},
journal={arXiv preprint arXiv:2407.11174},
year={2024}
}
@article{khanal2024active,
title={Active Label Refinement for Robust Training of Imbalanced Medical Image Classification Tasks in the Presence of High Label Noise},
author={Khanal, Bidur and Dai, Tianhong and Bhattarai, Binod and Linte, Cristian},
journal={arXiv preprint arXiv:2407.05973},
year={2024}
}
@article{khanal2024does,
title={How does self-supervised pretraining improve robustness against noisy labels across various medical image classification datasets?},
author={Khanal, Bidur and Bhattarai, Binod and Khanal, Bishesh and Linte, Cristian},
journal={arXiv preprint arXiv:2401.07990},
year={2024}
}
@article{poudel2024car,
title={CAR-MFL: Cross-Modal Augmentation by Retrieval for Multimodal Federated Learning with Missing Modalities},
author={Poudel, Pranav and Shrestha, Prashant and Amgain, Sanskar and Shrestha, Yash Raj and Gyawali, Prashnna and Bhattarai, Binod},
journal={arXiv preprint arXiv:2407.08648},
year={2024}
}
@article{pokhrel2024tta,
title={TTA-OOD: Test-time Augmentation for Improving Out-of-Distribution Detection in Gastrointestinal Vision},
author={Pokhrel, Sandesh and Bhandari, Sanjay and Vazquez, Eduard and Lambrou, Tryphon and Gyawali, Prashnna and Bhattarai, Binod},
journal={arXiv preprint arXiv:2407.14024},
year={2024}
}
@misc{pokhrel2024crosstaskdataaugmentationpseudolabel,
title={Cross-Task Data Augmentation by Pseudo-label Generation for Region Based Coronary Artery Instance Segmentation},
author={Sandesh Pokhrel and Sanjay Bhandari and Eduard Vazquez and Yash Raj Shrestha and Binod Bhattarai},
year={2024},
eprint={2310.05990},
archivePrefix={arXiv},
primaryClass={eess.IV},
url={https://arxiv.org/abs/2310.05990}
}
@article{Khanal2024InvestigatingTR,
title={Investigating the Robustness of Vision Transformers against Label Noise in Medical Image Classification},
author={Bidur Khanal and Prashant Shrestha and Sanskar Amgain and Bishesh Khanal and Binod Bhattarai and Cristian A. Linte},
journal={ArXiv},
year={2024},
volume={abs/2402.16734},
url={https://api.semanticscholar.org/CorpusID:268678393}
}
ReweightOOD: Loss Reweighting for Distance-based OOD Detection
@inproceedings{regmi2024reweightood,
title={ReweightOOD: Loss Reweighting for Distance-based OOD Detection},
author={Regmi, Sudarshan and Panthi, Bibek and Ming, Yifei and Gyawali, Prashnna K and Stoyanov, Danail and Bhattarai, Binod},
booktitle={Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
year={2024},
pages={131--141}
}
AI-Assisted Cervical Cancer Screening
@article{Poudel2024AIAssistedCC,
title={AI-Assisted Cervical Cancer Screening},
author={Poudel, Kanchan and Poudel, Lisasha and Shakya, Prabin Raj and Poudel, Atit and Shrestha, Archana and Khanal, Bishesh},
journal={arXiv preprint arXiv:2403.11936},
year={2024}
}
VLSM-Adapter: Finetuning Vision-Language Segmentation Efficiently with Lightweight Blocks
@article{dhakal2024vlsm,
title={VLSM-Adapter: Finetuning Vision-Language Segmentation Efficiently with Lightweight Blocks},
author={Dhakal, Manish and Adhikari, Rabin and Thapaliya, Safal and Khanal, Bishesh},
journal={arXiv preprint arXiv:2405.06196},
month={May 10}
}
Metric Transform: Exploring beyond Affine Transform for Neural Networks
@article{sapkota2023metric,
title={Metric Transform: Exploring beyond Affine Transform for Neural Networks},
author={Sapkota, Suman and Bhattarai, Binod},
year={2023}
}
@article{jha2023objective,
title={An objective validation of polyp and instrument segmentation methods in colonoscopy through Medico 2020 polyp segmentation and MedAI 2021 transparency challenges},
author={Jha, Debesh and Sharma, Vanshali and Banik, Debapriya and Bhattacharya, Debayan and Roy, Kaushiki and Hicks, Steven A and Tomar, Nikhil Kumar and Thambawita, Vajira and Krenzer, Adrian and Ji, Ge-Peng and others},
journal={arXiv preprint arXiv:2307.16262},
year={2023}
}
@inproceedings{adhikari2023synthetic,
title={Synthetic Boost: Leveraging Synthetic Data for Enhanced Vision-Language Segmentation in Echocardiography},
author={Adhikari, Rabin and Dhakal, Manish and Thapaliya, Safal and Poudel, Kanchan and Bhandari, Prasiddha and Khanal, Bishesh},
booktitle={International Workshop on Advances in Simplifying Medical Ultrasound},
pages={89--99},
year={2023},
organization={Springer}
}
Exploring transfer learning in medical image segmentation using vision-language models
@article{poudel2023exploring,
title={Exploring transfer learning in medical image segmentation using vision-language models},
author={Poudel, Kanchan and Dhakal, Manish and Bhandari, Prasiddha and Adhikari, Rabin and Thapaliya, Safal
and Khanal, Bishesh},
journal={arXiv preprint arXiv:2308.07706},
year={2023}
}
@article{lekadir2023future,
title={FUTURE-AI: International consensus guideline for trustworthy and deployable artificial intelligence
in healthcare},
author={Lekadir, Karim and Feragen, Aasa and Fofanah, Abdul Joseph and Frangi, Alejandro F and Buyx, Alena
and Emelie, Anais and Lara, Andrea and Porras, Antonio R and Chan, An-Wen and Navarro, Arcadi and others},
journal={arXiv preprint arXiv:2309.12325},
year={2023}
}
Improving Medical Image Classification in Noisy Labels Using Only Self-supervised Pretraining
@inproceedings{khanal2023improving,
title={Improving Medical Image Classification in Noisy Labels Using only Self-supervised Pretraining},
author={Khanal, Bidur and Bhattarai, Binod and Khanal, Bishesh and Linte, Cristian A},
booktitle={MICCAI Workshop on Data Engineering in Medical Imaging},
pages={78--90},
year={2023},
organization={Springer}
}
@article{nwoye2023cholectriplet2022,
title={CholecTriplet2022: Show me a tool and tell me the triplet--an endoscopic vision
challenge for surgical action triplet detection},
author={Nwoye, Chinedu Innocent and Yu, Tong and Sharma, Saurav and Murali, Aditya and Alapatt, Deepak and Vardazaryan, Armine and Yuan, Kun and Hajek, Jonas and Reiter, Wolfgang and Yamlahi, Amine and others},
journal={arXiv preprint arXiv:2302.06294},
year={2023}
}
Emerging Avenue of Artificial Intelligence and Ethical Considerations
@article{khanal2023emerging,
title={Emerging Avenue of Artificial Intelligence and Ethical Considerations},
author={Khanal, Bishesh},
year={2023}
}
Neural Network Pruning for Real-time Polyp Segmentation
title={Neural Network Pruning for Real-time Polyp Segmentation},
author={Sapkota, Suman and Poudel, Pranav and Regmi, Sudarshan and Panthi, Bibek and Bhattarai, Binod},
journal={arXiv preprint arXiv:2306.13203},
year={2023}
}
@article{khanal2023m, <
title={M-VAAL: Multimodal Variational Adversarial Active Learning for Downstream Medical
Image Analysis Tasks},
author={Khanal, Bidur and Bhattarai, Binod and Khanal, Bishesh and Stoyanov, Danail and
Linte, Cristian A},
journal={arXiv preprint arXiv:2306.12376},
year={2023}
}
A Client-server Deep Federated Learning for Cross-domain Surgical Image Segmentation
@article{subedi2023client,
title={A Client-server Deep Federated Learning for Cross-domain Surgical Image Segmentation},
author={Subedi, Ronast and Gaire, Rebati Raman and Ali, Sharib and Nguyen, Anh and Stoyanov, Danail and Bhattarai, Binod},
journal={arXiv preprint arXiv:2306.08720},
year={2023}
}
T2FNorm: Extremely Simple Scaled Train-time Feature Normalization for OOD Detection
@article{regmi2023t2fnorm,
title={T2FNorm: Extremely Simple Scaled Train-time Feature Normalization for OOD Detection},
author={Regmi, Sudarshan and Panthi, Bibek and Dotel, Sakar and Gyawali, Prashnna K and Stoynov, Danail and Bhattarai, Binod},
journal={arXiv preprint arXiv:2305.17797},
year={2023}
}
@article{bhattarai2022histogram,
title={Histogram of Oriented Gradients Meet Deep Learning: A Novel Multi-task Deep Network for Medical Image Semantic Segmentation},
author={Bhattarai, Binod and Subedi, Ronast and Gaire, Rebati Raman and Vazquez, Eduard and Stoyanov, Danail},
journal={arXiv preprint arXiv:2204.01712},
year={2022}
}
Benchmarking Encoder-Decoder Architectures for Biplanar X-ray to 3D Bone Shape Reconstruction
@article{hasan2022challenges,
title={Challenges of deep learning methods for COVID-19 detection using public datasets},
author={Hasan, Md Kamrul and Alam, Md Ashraful and Dahal, Lavsen and Roy, Shidhartho and Wahid, Sifat Redwan and Elahi, Md Toufick E and Mart{\'\i}, Robert and Khanal, Bishesh},
journal={Informatics in Medicine Unlocked},
volume={30},
pages={100945},
year={2022},
publisher={Elsevier}
}
Investigating the impact of class-dependent label noise in medical image classification
@article{}
@article{bano2023placental,
title={Placental Vessel Segmentation and Registration in Fetoscopy: Literature Review and
MICCAI FetReg2021 Challenge Findings},
author={Bano, Sophia and Casella, Alessandro and Vasconcelos, Francisco and Qayyum, Abdul
and Benzinou, Abdesslam and Mazher, Moona and Meriaudeau, Fabrice and Lena, Chiara and Cintorrino, Ilaria
Anita and De Paolis, Gaia Romana and others},
journal={Medical Image Analysis},
year={2023}
}
@article{sapkota2021input,
title={Input Invex Neural Network},
author={Sapkota, Suman and Bhattarai, Binod},
journal={arXiv preprint arXiv:2106.08748},
year={2023}
}
Fast fetal head compounding from multi-view 3D ultrasound
@article{wright2023fast,
title={Fast fetal head compounding from multi-view 3D ultrasound},
author={Wright, Robert and Gomez, Alberto and Zimmer, Veronika A and Toussaint,
Nicolas and Khanal, Bishesh and Matthew, Jacqueline and Skelton, Emily and Kainz, Bernhard and Rueckert, Daniel
and Hajnal, Joseph V and others},
journal={Medical Image Analysis},
pages={102793},
year={2023},
publisher={Elsevier}
}
@book{albarqouni2022distributed,
title={Distributed, Collaborative, and Federated Learning, and Affordable AI and
Healthcare for Resource Diverse Global Health: Third MICCAI Workshop, DeCaF 2022, and Second MICCAI
Workshop, FAIR 2022, Held in Conjunction with MICCAI 2022, Singapore, September 18 and 22, 2022,
Proceedings},
author={Albarqouni, Shadi and Bakas, Spyridon and Bano, Sophia and Cardoso, M
Jorge and Khanal, Bishesh and Landman, Bennett and Li, Xiaoxiao and Qin, Chen and Rekik, Islem and Rieke,
Nicola and others},
volume={13573},
year={2022},
publisher={Springer Nature}
}
Noisy Heuristics NAS: A Network Morphism based Neural Architecture Search using Heuristics
@article{sapkota2022noisy,
title={Noisy Heuristics NAS: A Network Morphism based Neural Architecture
Search using Heuristics},
author={Sapkota, Suman and Bhattarai, Binod},
journal={arXiv preprint arXiv:2207.04467},
year={2022}
}
NepBERTa: Nepali Language Model Trained in a Large Corpus
@inproceedings{timilsina-etal-2022-nepberta,
title = "{N}ep{BERT}a: {N}epali Language Model Trained in a Large Corpus",
author = "Timilsina, Sulav and Gautam, Milan and Bhattarai, Binod",
booktitle = "Proceedings of the 2nd Conference of the Asia-Pacific
Chapter of the Association for Computational Linguistics and the 12th International Joint Conference on
Natural Language Processing (Volume 2: Short Papers)",
month = nov,
year = "2022",
address = "Online only",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.aacl-short.34",
pages = "273--284",
}
Challenges of Deep Learning Methods for COVID-19 Detection Using Public Datasets
@article{Hasan2020.11.07.20227504,
author = {Hasan, Md. Kamrul and Alam, Md. Ashraful and Dahal, Lavsen
and Elahi, Md. Toufick E and Roy,
Shidhartho and Wahid, Sifat Redwan and Mart\'i, Robert and Khanal,
Bishesh},
title = {Challenges of Deep Learning Methods for COVID-19 Detection
Using Public Datasets},
elocation-id = {2020.11.07.20227504},
year = {2020},
doi = {10.1101/2020.11.07.20227504},
publisher = {Cold Spring Harbor Laboratory Press},
}
COVID-19-related Nepali Tweets Classification in a Low Resource Setting
@inproceedings{adhikari-etal-2022-covid,
title = "{COVID}-19-related {N}epali Tweets Classification in a
Low Resource Setting",
author = "Adhikari, Rabin and Thapaliya, Safal and Basnet,
Nirajan and Poudel, Samip and Shakya,
Aman and Khanal, Bishesh",
booktitle = "Proceedings of The Seventh Workshop on Social Media
Mining for Health Applications,
Workshop & Shared Task",
month = oct,
year = "2022",
address = "Gyeongju, Republic of Korea",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.smm4h-1.52",
pages = "209--215",
}
FixMatchSeg: Fixing FixMatch for Semi-Supervised Semantic Segmentation
@article{upretee2022fixmatchseg,
title={FixMatchSeg: Fixing FixMatch for Semi-Supervised Semantic Segmentation},
author={Upretee, Pratima and Khanal, Bishesh},
journal={arXiv preprint arXiv:2208.00400},
year={2022}
}
Task-Aware Active Learning for Endoscopic Polyp Segmentation
@article{thapa2023task,
title={Task-Aware Active Learning for Endoscopic Polyp Segmentation},
author={Thapa, Shrawan Kumar and Poudel, Pranav and Regmi, Sudarshan and Bhattarai, Binod and Stoyanov, Danail},
year={2023},
publisher={TechRxiv}
}
Label Geometry Aware Discriminator for Conditional Generative Networks
@inproceedings{sapkota2022label,
title={Label Geometry Aware Discriminator for Conditional Generative Adversarial Networks},
author={Sapkota, Suman and Khanal, Bidur and Bhattarai, Binod and Khanal, Bishesh and Kim, Tae-Kyun},
booktitle={2022 26th International Conference on Pattern Recognition (ICPR)},
pages={2914--2920},
year={2022},
organization={IEEE}
}
TGANet: Text-guided attention for improved polyp segmentation
@InProceedings{10.1007/978-3-031-16437-8_15,
author="Tomar, Nikhil Kumar and Jha, Debesh and Bagci, Ulas and Ali, Sharib",
editor="Wang, Linwei and Dou, Qi and Fletcher, P. Thomas and Speidel, Stefanie and Li, Shuo",
title="TGANet: Text-Guided Attention for Improved Polyp Segmentation",
booktitle="Medical Image Computing and Computer Assisted Intervention -- MICCAI 2022",
year="2022",
publisher="Springer Nature Switzerland",
address="Cham",
pages="151--160",
isbn="978-3-031-16437-8"
}
Task-Aware Active Learning for Endoscopic Image Analysis
@article{thapa2022task,
title={Task-Aware Active Learning for Endoscopic Image Analysis},
author={Thapa, Shrawan Kumar and Poudel, Pranav and Bhattarai, Binod and Stoyanov,Danail},
journal={arXiv preprint arXiv:2204.03440},
year={2022}
}
@article{ali2022assessing,
title={Assessing generalisability of deep learning-based polyp detection and segmentation
methods through a computer vision challenge},
author={Ali, Sharib and Ghatwary, Noha and Jha, Debesh and Isik-Polat, Ece and Polat, Gorkem and
Yang, Chen and Li, Wuyang and Galdran, Adrian and Ballester, Miguel-{\'A}ngel Gonz{\'a}lez and Thambawita,
Vajira and others},
journal={arXiv preprint arXiv:2202.12031},
year={2022}
}
Machine-Learning-Assisted Analysis of Colorimetric Assays on Paper Analytical Devices
@article{khanal2021machine,
title={Machine-Learning-Assisted Analysis of Colorimetric Assays on Paper Analytical Devices},
author={Khanal, Bidur and Pokhrel, Pravin and Khanal, Bishesh and Giri, Basant},
journal={ACS omega},
volume={6},
number={49},
pages={33837--33845},
year={2021},
publisher={ACS Publications}
}
Iterative deep learning for improved segmentation of endoscopic images
@article{ali2021iterative,
title={Iterative deep learning for improved segmentation of endoscopic images},
author={Ali, Sharib and Tomar, Nikhil K},
journal={Nordic Machine Intelligence},
volume={1},
number={1},
pages={38--40},
year={2021}
}
@article{wang2021evaluation,
title={Evaluation and Comparison of Accurate Automated Spinal Curvature Estimation Algorithms
with Spinal Anterior-posterior X-Ray Images: The AASCE2019 Challenge},
author={Wang, Liansheng and Xie, Cong and Lin, Yi and Zhou, Hong-Yu and Chen, Kailin and Cheng,
Dalong and Dubost, Florian and Collery, Benjamin and Khanal, Bidur and Khanal, Bishesh and others},
journal={Medical Image Analysis},
pages={102115},
year={2021},
publisher={Elsevier}
}
Visualising Argumentation Graphs with Graph Embeddings and t-SNE
@article{malmqvist2021visualising,
title={Visualising Argumentation Graphs with Graph Embeddings and t-SNE},
author={Malmqvist, Lars and Yuan, Tommy and Manandhar, Suresh},
journal={arXiv preprint arXiv:2107.00528},
year={2021}
}
COVID-19 control strategies and intervention effects in resource limited settings: a modeling study
@article{pandey2021covid,
title={COVID-19 control strategies and intervention effects in resource limited settings: a
modeling study},
author={Pandey, Kiran Raj and Subedee, Anup and Khanal, Bishesh and Koirala, Bhagawan},
journal={Plos one},
volume={16},
number={6},
pages={e0252570},
year={2021},
publisher={Public Library of Science San Francisco, CA USA}
}
Penalizing small errors using an Adaptive Logarithmic Loss
@inproceedings{kaul2021penalizing,
title={Penalizing small errors using an adaptive logarithmic loss},
author={Kaul, Chaitanya and Pears, Nick and Dai, Hang and Murray-Smith, Roderick and Manandhar,
Suresh},
booktitle={International Conference on Pattern Recognition},
pages={368--375},
year={2021},
organization={Springer}
}
FatNet: A feature-attentive network for 3D point cloud processing
@inproceedings{kaul2021fatnet,
title={FatNet: A feature-attentive network for 3D point cloud processing},
author={Kaul, Chaitanya and Pears, Nick and Manandhar, Suresh},
booktitle={2020 25th International Conference on Pattern Recognition (ICPR)},
pages={7211--7218},
year={2021},
organization={IEEE}
}
Ensemble U-Net model for efficient polyp segmentation
@article{shrestha2020ensemble,
title={Ensemble U-Net model for efficient polyp segmentation},
author={Shrestha, Shruti and Khanal, Bishesh and Ali, Sharib},
year={2020}
}
@article{SKELTON2021519,
title={Towards automated extraction of 2D standard fetal head planes from 3D ultrasound
acquisitions: A clinical evaluation and quality assessment comparison},
journal={Radiography},
volume={27},
number={2},
pages={519-526},
year={2021},
issn={1078-8174},
doi={https://doi.org/10.1016/j.radi.2020.11.006},
url={https://www.sciencedirect.com/science/article/pii/S1078817420302352},
author={E. Skelton and J. Matthew and Y. Li and B. Khanal and J.J. {Cerrolaza Martinez} and N.
Toussaint and C. Gupta and C. Knight and B. Kainz and J.V. Hajnal and M. Rutherford},
keywords={Clinical evaluation, Fetal imaging, Quality assessment, Ultrasound}
}
Methods: Two observers retrospectively reviewed standard fetal head planes against pre-defined image quality criteria. Forty-eight images (29 transventricular, 19 transcerebellar) were selected from 91 transabdominal fetal scans (mean gestational age ¼ 26 completed weeks, range ¼ 20þ5e32þ3 weeks). Each had two-dimensional (2D) manually-acquired (2D-MA), 3D operator-selected (3D-OS) and 3D-DL automatically-acquired (3D-DL) images. The proportion of adequate images from each plane and modality, and the number of inadequate images per plane was compared for each method. Inter and intraobserver agreement of overall image quality was calculated.
Results: Sixty-seven percent of 3D-OS and 3D-DL transventricular planes were adequate quality. Fortyf ive percent of 3D-OS and 55% of 3D-DL transcerebellar planes were adequate. Seventy-one percent of 3D-OS and 86% of 3D-DL transventricular planes failed with poor visualisation of intra-cranial structures. Eighty-six percent of 3D-OS and 80% of 3D-DL transcerebellar planes failed due to inadequate visualisation of cerebellar hemispheres. Image quality was significantly different between 2D and 3D, however, no significant difference between 3D-modalities was demonstrated (p < 0.005). Inter-observer agreement of transventricular plane adequacy was moderate for both 3D-modalities, and weak for transcerebellar planes.
Conclusion: The 3D-DL algorithm can automatically extract standard fetal head planes from 3D-head volumes of comparable quality to operator-selected planes. Image quality in 3D is inferior to corresponding 2D planes, likely due to limitations with 3D-technology and acquisition technique. Implications for practice: Automated image extraction of standard planes from US-volumes could facilitate use of 3DUS in clinical practice, however image quality is dependent on the volume acquisition technique.
Determining the Acceptability of Abstract Arguments with Graph Convolutional Networks
@inproceedings{malmqvist2020determining,
title={Determining the Acceptability of Abstract Arguments with Graph Convolutional Networks.},
author={Malmqvist, Lars and Yuan, Tommy and Nightingale, Peter and Manandhar, Suresh},
booktitle={SAFA@ COMMA},
pages={47--56},
year={2020}
}
Uncertainty Estimation in Deep 2D Echocardiography Segmentation
@misc{dahal2020uncertainty, <
title={Uncertainty Estimation in Deep 2D Echocardiography Segmentation},
author={Lavsen Dahal and Aayush Kafle and Bishesh Khanal},
year={2020},
eprint={2005.09349},
archivePrefix={arXiv},
primaryClass={cs.CV}
}
Automatic Cobb Angle Detection using Vertebra Detector and Vertebra Corners Regression
@misc{khanal2019automaticcobbangledetection,
title={Automatic Cobb Angle Detection using Vertebra Detector and Vertebra Corners Regression},
author={Bidur Khanal and Lavsen Dahal and Prashant Adhikari and Bishesh Khanal},
year={2019},
eprint={1910.14202},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/1910.14202},
}
Image Reconstruction in a Manifold of Image Patches: Application to Whole-fetus Ultrasound Imaging
@inproceedings{gomez2019image,
title={Image Reconstruction in a Manifold of Image Patches: Application to Whole-fetus
Ultrasound Imaging},
author={Gomez, Alberto and Zimmer, Veronika and Toussaint, Nicolas and Wright, Robert and
Clough, James R. and Khanal, Bishesh and Poppel, Milou Van and Skelton, Emily and Matthews,
Jackie and Schnabel, Julia A.},
booktitle={Machine Learning for Medical Image Reconstruction - MLMIR},
year={2019},
note={Accepted}
}
Towards whole placenta segmentation at late gestation using multi-view ultrasound images
@inproceedings{zimmer2019towards,
title={Towards whole placenta segmentation at late gestation using multi-view ultrasound images},
author={Zimmer, Veronika and Gomez, Alberto and Skelton, Emily and Toussaint, Nicolas and
Zhang, Tong and Khanal, Bishesh and Wright, Robert and Noh,
Yohan and Ho, Alison and Matthew, Jacqueline and Schnabel, Julia},
booktitle={MICCAI},
year={2019}
}
Confident Head Circumference Measurement from Ultrasound with Real-time Feedback for Sonographers
@inproceedings{budd2019confident,
title={Confident Head Circumference Measurement from Ultrasound with Real-time Feedback for Sonographers},
author={Budd, Samuel and Sinclair, Matthew and Khanal, Bishesh and Matthew, Jacqueline and
Llyod, David and Gomez, Alberto and Toussaint, Nicolas and Robinson, Emma and Kainz, Bernhard},
booktitle={MICCAI},
year={2019},
note={Accepted}
}
Complete Fetal Head Compounding from Multi-View 3D Ultrasound
@inproceedings{wright2019complete,
title={Complete Fetal Head Compounding from Multi-View 3D Ultrasound},
author={Wright, Robert and Toussaint, Nicolas and Gomez, Alberto and Zimmer, Veronika and Matthew, Jacqueline and Skelton, Emily and Khanal, Bishesh and Kainz, Bernhard and Reuckert, Daniel and Hajnal, Jo and Schnabel, Julia},
booktitle={MICCAI},
year={2019},
note={Accepted}
}
Adapted and Oversegmenting Graphs: Application to Geometric Deep Learning
@article{gomez2018oversegmenting,
title={Oversegmenting Graphs},
author={Gomez, Alberto and Zimmer, Veronika A and Khanal, Bishesh and Toussaint, Nicolas and
Schnabel, Julia A},
journal={arXiv preprint arXiv:1806.00411},
year={2018},
note={under review}
}

