Copyright © 2026 Authors retain the copyright of this article. This article is an open access article distributed under the Creative Commons Attribution License which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.
@article{192699,
author = {Mulla Sheema Anjum and VANNEAL SANGEETHA and MYDUKUR SWETHA SREE and GOLLALADOODI VANITHA SREE and S. S. RAJA KUMARI and Dr. P. Veeresh},
title = {INTELLIGENT VISUAL INQUIRY SYSTEM USING DEEP LEARNING AND NLP FOR CONTEXTUAL RESPONSE GENERATION},
journal = {International Journal of Innovative Research in Technology},
year = {2026},
volume = {12},
number = {9},
pages = {1950-1954},
issn = {2349-6002},
url = {https://ijirt.org/article?manuscript=192699},
abstract = {The system is a research project on developing a Visual Inquiry (VI) system utilizing deep learning for visual comprehension and Natural Language Processing (NLP) for making context- based replies. VI systems are intended to understand and respond to visual content questions to deliver natural-style cognition and interaction. The system leverages Convolutional Neural Networks (CNNs) to obtain the visual features of the images to obtain salient facts like objects, scenes, and spatial relationships. They are then merged with NLP models that detect the input question in an attempt to display a compound presentation of text and image knowledge. Worthy of mention here are the use of state-of-the-art models such as attention mechanisms and Transformer models to project the image features onto the semantic features of the question. Attention layers enable the model to attend to the correct location in the image and enhance the accuracy of response generation. VI system is trained on vast amounts of data, for example, the VI v2 or Visual Genome dataset, with labeled images, questions, and answers. With the addition of vision and language processing, this VI system is able to answer appropriately to various types of questions, ranging from object recognition to more abstract reasoning questions.},
keywords = {Convolution Neural Networks (CNN), Vision Transaction, Image segmentation, Large Language Models (LLms), Transformer Architecture (BERT, GPT, T5), Question Answering Systems, Named Entity Recognition},
month = {February},
}
Cite This Article
Submit your research paper and those of your network (friends, colleagues, or peers) through your IPN account, and receive 800 INR for each paper that gets published.
Join NowNational Conference on Sustainable Engineering and Management - 2024 Last Date: 15th March 2024
Submit inquiry