Xu Wang, Yifan Li, Qiudan Zhang, Wenhui Wu, Mark Junjie Li, Lin Ma, Jianmin Jiang
{"title":"Weakly-Supervised 3D Scene Graph Generation via Visual-Linguistic Assisted Pseudo-labeling","authors":"Xu Wang, Yifan Li, Qiudan Zhang, Wenhui Wu, Mark Junjie Li, Lin Ma, Jianmin Jiang","doi":"10.1109/tmm.2024.3443670","DOIUrl":"https://doi.org/10.1109/tmm.2024.3443670","url":null,"abstract":"","PeriodicalId":13273,"journal":{"name":"IEEE Transactions on Multimedia","volume":"27 1","pages":""},"PeriodicalIF":7.3,"publicationDate":"2024-08-16","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"142178737","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":1,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Controllable Syllable-Level Lyrics Generation from Melody with Prior Attention","authors":"Zhe Zhang, Yi Yu, Atsuhiro Takasu","doi":"10.1109/tmm.2024.3443664","DOIUrl":"https://doi.org/10.1109/tmm.2024.3443664","url":null,"abstract":"","PeriodicalId":13273,"journal":{"name":"IEEE Transactions on Multimedia","volume":"6 1","pages":""},"PeriodicalIF":7.3,"publicationDate":"2024-08-15","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"142178740","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":1,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Anti-Collapse Loss for Deep Metric Learning","authors":"Xiruo Jiang, Yazhou Yao, Xili Dai, Fumin Shen, Liqiang Nie, Heng-Tao Shen","doi":"10.1109/tmm.2024.3443616","DOIUrl":"https://doi.org/10.1109/tmm.2024.3443616","url":null,"abstract":"","PeriodicalId":13273,"journal":{"name":"IEEE Transactions on Multimedia","volume":"4 1","pages":""},"PeriodicalIF":7.3,"publicationDate":"2024-08-15","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"142178739","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":1,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Di Wang, Xiantao Lu, Quan Wang, Yumin Tian, Bo Wan, Lihuo He
{"title":"Gist,Content,Target-Oriented:A 3-Level Human-Like Framework for Video Moment Retrieval","authors":"Di Wang, Xiantao Lu, Quan Wang, Yumin Tian, Bo Wan, Lihuo He","doi":"10.1109/tmm.2024.3443672","DOIUrl":"https://doi.org/10.1109/tmm.2024.3443672","url":null,"abstract":"","PeriodicalId":13273,"journal":{"name":"IEEE Transactions on Multimedia","volume":"46 1","pages":""},"PeriodicalIF":7.3,"publicationDate":"2024-08-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"142178711","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":1,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Yonghao Dong, Le Wang, Sanping Zhou, Gang Hua, Changyin Sun
{"title":"Sparse Pedestrian Character Learning for Trajectory Prediction","authors":"Yonghao Dong, Le Wang, Sanping Zhou, Gang Hua, Changyin Sun","doi":"10.1109/tmm.2024.3443591","DOIUrl":"https://doi.org/10.1109/tmm.2024.3443591","url":null,"abstract":"","PeriodicalId":13273,"journal":{"name":"IEEE Transactions on Multimedia","volume":"39 1","pages":""},"PeriodicalIF":7.3,"publicationDate":"2024-08-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"142178744","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":1,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Heng Huang, Lin Zhao, Haixing Dai, Lu Zhang, Xintao Hu, Dajiang Zhu, Tianming Liu
{"title":"BI-AVAN: A Brain-Inspired Adversarial Visual Attention Network for Characterizing Human Visual Attention from Neural Activity","authors":"Heng Huang, Lin Zhao, Haixing Dai, Lu Zhang, Xintao Hu, Dajiang Zhu, Tianming Liu","doi":"10.1109/tmm.2024.3443623","DOIUrl":"https://doi.org/10.1109/tmm.2024.3443623","url":null,"abstract":"","PeriodicalId":13273,"journal":{"name":"IEEE Transactions on Multimedia","volume":"386 1","pages":""},"PeriodicalIF":7.3,"publicationDate":"2024-08-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"142178707","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":1,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"RCVS: A Unified Registration and Fusion Framework for Video Streams","authors":"Housheng Xie, Meng Sang, Yukuan Zhang, Yang Yang, Shan Zhao, Jianbo Zhong","doi":"10.1109/tmm.2024.3443673","DOIUrl":"https://doi.org/10.1109/tmm.2024.3443673","url":null,"abstract":"","PeriodicalId":13273,"journal":{"name":"IEEE Transactions on Multimedia","volume":"81 1","pages":""},"PeriodicalIF":7.3,"publicationDate":"2024-08-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"142178741","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":1,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}