Xiaoying Pan, Ningxin Jia, Yuanzhen Mu, Weidong Bai
{"title":"MSFE-PANet: Improved YOLOv4-based Small Object Detection Method in Complex Scenes","authors":"Xiaoying Pan, Ningxin Jia, Yuanzhen Mu, Weidong Bai","doi":"10.1142/s0218001423500246","DOIUrl":"https://doi.org/10.1142/s0218001423500246","url":null,"abstract":"With the rapid development of computer vision and artificial intelligence technology, visual object detection has made unprecedented progress, and small object detection in complex scenes has attracted more and more attention. To solve the problems of ambiguity, overlap and occlusion in small object detection in complex scenes. In this paper, a multi-scale fusion feature enhanced path aggregation network MSFE-PANet is proposed. By adding attention mechanism and feature fusion, the fusion of strong positioning information of deep feature map and strong semantic information of shallow feature map is enhanced, which helps the network to find interesting areas in complex scenes and improve its sensitivity to small objects. The rejection loss function and network prediction scale are designed to solve the problems of missing detection and false detection of overlapping and blocking small objects in complex backgrounds. The proposed method achieves an accuracy of 40.7% on the VisDrone2021 dataset and 89.7% on the PASCAL VOC dataset. Comparative analysis with mainstream object detection algorithms proves the superiority of this method in detecting small objects in complex scenes.","PeriodicalId":54949,"journal":{"name":"International Journal of Pattern Recognition and Artificial Intelligence","volume":"49 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2023-08-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"135872875","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":4,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"TCNN Architecture for Partial Occlusion Handling in Pedestrian Classification","authors":"M. Thu, N. Suvonvorn","doi":"10.1142/s0218001423500258","DOIUrl":"https://doi.org/10.1142/s0218001423500258","url":null,"abstract":"","PeriodicalId":54949,"journal":{"name":"International Journal of Pattern Recognition and Artificial Intelligence","volume":" ","pages":""},"PeriodicalIF":1.5,"publicationDate":"2023-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"41736317","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":4,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
G. Wang, Mingliang Zhou, Bin Fang, Yugui Zhang, Shouqin Guan, Bin Ruan, Zelin Li
{"title":"Fast 3D Object Measurement based on Point Cloud Modeling","authors":"G. Wang, Mingliang Zhou, Bin Fang, Yugui Zhang, Shouqin Guan, Bin Ruan, Zelin Li","doi":"10.1142/s0218001423550133","DOIUrl":"https://doi.org/10.1142/s0218001423550133","url":null,"abstract":"","PeriodicalId":54949,"journal":{"name":"International Journal of Pattern Recognition and Artificial Intelligence","volume":"1 1","pages":""},"PeriodicalIF":1.5,"publicationDate":"2023-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"63936064","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":4,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Multi-scale Orthogonal Model CNN-Transformer For Medical Image Segmentation","authors":"Wuyi Zhou, Xianhua Zeng, Mingkun Zhou","doi":"10.1142/s0218001423370016","DOIUrl":"https://doi.org/10.1142/s0218001423370016","url":null,"abstract":"","PeriodicalId":54949,"journal":{"name":"International Journal of Pattern Recognition and Artificial Intelligence","volume":" ","pages":""},"PeriodicalIF":1.5,"publicationDate":"2023-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"42925531","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":4,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Multi-Network based Ensemble Deep Learning model to Forecast Ross River virus Outbreak in Australia","authors":"Mohd Sakib, Tamanna Siddiqui","doi":"10.1142/s0218001423520158","DOIUrl":"https://doi.org/10.1142/s0218001423520158","url":null,"abstract":"","PeriodicalId":54949,"journal":{"name":"International Journal of Pattern Recognition and Artificial Intelligence","volume":" ","pages":""},"PeriodicalIF":1.5,"publicationDate":"2023-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"49066325","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":4,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Xingquan Cai, R. Lu, Pengyan Cheng, Jiali Yao, Yan Hu
{"title":"An Extended Labanotation Generation Method Based on 3D Human Pose Estimation for Intangible Cultural Heritage Dance Videos","authors":"Xingquan Cai, R. Lu, Pengyan Cheng, Jiali Yao, Yan Hu","doi":"10.1142/s0218001423550121","DOIUrl":"https://doi.org/10.1142/s0218001423550121","url":null,"abstract":"","PeriodicalId":54949,"journal":{"name":"International Journal of Pattern Recognition and Artificial Intelligence","volume":"22 1","pages":""},"PeriodicalIF":1.5,"publicationDate":"2023-07-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"63936024","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":4,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}