diff options
| author | jules@lens <julescarbon@gmail.com> | 2019-02-20 18:36:25 +0100 |
|---|---|---|
| committer | jules@lens <julescarbon@gmail.com> | 2019-02-20 18:36:25 +0100 |
| commit | 2116027843edad22d87e6a56269b26cd6aafb8e8 (patch) | |
| tree | ae15c70898a3ee28668a154ccdc1e600af51834c /site/datasets/citations/coco.json | |
| parent | 1ef0b07c0bbd779f3ab9b618a0edb768b927816e (diff) | |
updating all reports
Diffstat (limited to 'site/datasets/citations/coco.json')
| -rw-r--r-- | site/datasets/citations/coco.json | 2 |
1 files changed, 1 insertions, 1 deletions
diff --git a/site/datasets/citations/coco.json b/site/datasets/citations/coco.json index e7fc0b8d..76389ffb 100644 --- a/site/datasets/citations/coco.json +++ b/site/datasets/citations/coco.json @@ -1 +1 @@ -{"id": "5e0f8c355a37a5a89351c02f174e7a5ddcb98683", "paper": {"paperId": "5e0f8c355a37a5a89351c02f174e7a5ddcb98683", "key": "coco", "title": "Microsoft COCO: Common Objects in Context", "journal": "Unknown", "address": "", "address_type": "", "lat": "", "lng": "", "pdf_link": "https://arxiv.org/pdf/1405.0312.pdf", "report_link": "papers/5e0f8c355a37a5a89351c02f174e7a5ddcb98683.html", "citation_count": 999, "citations_geocoded": 551, "citations_unknown": 448, "citations_empty": 30, "citations_pdf": 793, "citations_doi": 193, "name": "COCO"}, "address": null, "citations": [["Generating Natural Video Descriptions via Multimodal Processing", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2016"], ["Pyramid Scene Parsing Network", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "2017"], ["Analysis of Spatial, Temporal, and Content Characteristics of Videos in the YFCC100M Dataset", "Yonsei University, Incheon, South Korea", "Yonsei University", "Yonsei University", "\uc5f0\uc138\ub300, \uc5f0\uc138\ub85c, \uc2e0\ucd0c\ub3d9, \ucc3d\ucc9c\ub3d9, \uc11c\ub300\ubb38\uad6c, \uc11c\uc6b8\ud2b9\ubcc4\uc2dc, 03789, \ub300\ud55c\ubbfc\uad6d", "37.56004060", "126.93692480", "edu", "", "2016"], ["Context-Aware Captions from Context-Agnostic Supervision", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2017"], ["GLA: Global\u2013Local Attention for Image Description", "Key Laboratory of Intelligent Information Processing, Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "2018"], ["Generative Attention Model with Adversarial Self-learning for Visual Question Answering", "National University of Singapore, Singapore, Singapore", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "2017"], ["Superpixel Filtering for Mean Field Inference in CRFs Integrated with Convolutional Neural Networks", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2015"], ["Computer Vision and Deep Learning for Automated Surveillance Technology", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2016"], ["Socratic Learning: Augmenting Generative Models to Incorporate Latent Subsets in Training Data", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2016"], ["Multi-Person Pose Estimation for PoseTrack with Enhanced Part Affinity Fields", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2017"], ["ChestX-Ray8: Hospital-Scale Chest X-Ray Database and Benchmarks on Weakly-Supervised Classification and Localization of Common Thorax Diseases", "", "National Institutes of Health", "National Institutes of Health", "NIH, Pooks Hill, Bethesda, Montgomery County, Maryland, USA", "39.00041165", "-77.10327775", "edu", "", "2017"], ["Where to put the Image in an Image Caption Generator", "", "University of Malta", "University of Malta", "University of Malta, Ring Road, Japanese Garden, L-Imsida, Malta, MSD 9027, Malta", "35.90232260", "14.48341890", "edu", "", "2018"], ["Towards Context-aware Interaction Recognition", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2017"], ["Regional Gating Neural Networks for Multi-label Image Classification", "", "Shanghai, China", "Shanghai, China", "Shanghai, China", "31.23039040", "121.47370210", "edu", "", "2016"], ["BDD100K: A Diverse Driving Video Database with Scalable Annotation Tooling", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "2018"], ["The Color of the Cat is Gray: 1 Million Full-Sentences Visual Question Answering (FSVQA).", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "2016"], ["Accurate, Large Minibatch SGD: Training ImageNet in 1 Hour.", "", "Facebook", "Facebook", "250 Bryant St, Mountain View, CA 94041, USA", "37.39367170", "-122.08072620", "company", "Facebook, Mountain View, CA", "2017"], ["Action Classification via Concepts and Attributes", "", "Weizmann Institute of Science", "Weizmann Institute of Science", "\u05de\u05db\u05d5\u05df \u05d5\u05d9\u05e6\u05de\u05df \u05dc\u05de\u05d3\u05e2, \u05e9\u05d3\u05e8\u05ea \u05de\u05e8\u05db\u05d5\u05e1 \u05d6\u05d9\u05d5, \u05de\u05e2\u05d5\u05e0\u05d5\u05ea \u05e9\u05d9\u05d9\u05df, \u05d0\u05d7\u05d5\u05d6\u05d5\u05ea \u05d4\u05e0\u05e9\u05d9\u05d0, \u05e8\u05d7\u05d5\u05d1\u05d5\u05ea, \u05de\u05d7\u05d5\u05d6 \u05d4\u05de\u05e8\u05db\u05d6, NO, \u05d9\u05e9\u05e8\u05d0\u05dc", "31.90784990", "34.81334092", "edu", "", "2018"], ["A survey on social image understanding", "School of Computer Science and Technology", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2017"], ["Automated Melanoma Recognition in Dermoscopy Images via Very Deep Residual Networks", "Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong", "Chinese University of Hong Kong", "The Chinese University of Hong Kong", "\u4e2d\u5927 CUHK, NA\u68af New Asia Stairs, \u99ac\u6599\u6c34 Ma Liu Shui, \u4e5d\u809a\u6751 Kau To Village, \u6c99\u7530\u5340 Sha Tin District, \u65b0\u754c New Territories, HK, DD193 1191, \u4e2d\u56fd", "22.42031295", "114.20788644", "edu", "", "2017"], ["Learning to Learn: Model Regression Networks for Easy Small Sample Learning", "", "Robotics Institute", "Robotics Institute", "Institute for Field Robotics, \u0e1b\u0e23\u0e30\u0e0a\u0e32\u0e2d\u0e38\u0e17\u0e34\u0e28, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, \u0e40\u0e02\u0e15\u0e23\u0e32\u0e29\u0e0e\u0e23\u0e4c\u0e1a\u0e39\u0e23\u0e13\u0e30, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, 10140, \u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22", "13.65450525", "100.49423171", "edu", "", "2016"], ["Grounding of Textual Phrases in Images by Reconstruction", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "2016"], ["Image Captioning with Sentiment Terms via Weakly-Supervised Sentiment Dataset", "", "Tokyo, Japan", "Tokyo, Japan", "Tokyo, Japan", "35.68948750", "139.69170640", "edu", "", "2016"], ["iLab-20M: A Large-Scale Controlled Object Dataset to Investigate Deep Learning", "", "Amirkabir University of Technology", "Amirkabir University of Technology", "\u062f\u0627\u0646\u0634\u06af\u0627\u0647 \u0635\u0646\u0639\u062a\u06cc \u0627\u0645\u06cc\u0631\u06a9\u0628\u06cc\u0631, \u0648\u0644\u06cc \u0639\u0635\u0631, \u0645\u06cc\u062f\u0627\u0646 \u0648\u0644\u06cc\u0639\u0635\u0631, \u0645\u0646\u0637\u0642\u0647 \u06f6 \u0634\u0647\u0631 \u062a\u0647\u0631\u0627\u0646, \u062a\u0647\u0631\u0627\u0646, \u0628\u062e\u0634 \u0645\u0631\u06a9\u0632\u06cc \u0634\u0647\u0631\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0634\u0647\u0631\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0627\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0646\u0628\u0634 \u0628\u0631\u0627\u062f\u0631\u0627\u0646 \u0645\u0638\u0641\u0631, \u200f\u0627\u06cc\u0631\u0627\u0646\u200e", "35.70451400", "51.40972058", "edu", "", "2016"], ["Social Image Tags as a Source of Word Embeddings: A Task-oriented Evaluation", "", "Waseda University", "Waseda University", "\u65e9\u7a32\u7530\u5927\u5b66 \u5317\u4e5d\u5dde\u30ad\u30e3\u30f3\u30d1\u30b9, 2-2, \u6709\u6bdb\u5f15\u91ce\u7dda, \u516b\u5e61\u897f\u533a, \u5317\u4e5d\u5dde\u5e02, \u798f\u5ca1\u770c, \u4e5d\u5dde\u5730\u65b9, 808-0135, \u65e5\u672c", "33.88987280", "130.70856205", "edu", "", "2018"], ["Modeling Image Virality with Pairwise Spatial Transformer Networks", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "2017"], ["Aided Action Recognition Using Single Images", "", "Lehigh University", "Lehigh University", "Lehigh University, Library Drive, Sayre Park, Bethlehem, Northampton County, Pennsylvania, 18015, USA", "40.60680280", "-75.37824880", "edu", "", "2017"], ["Weakly- and Semi-supervised Panoptic Segmentation", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2018"], ["Learning Object Detectors from Scratch with Gated Recurrent Feature Pyramids", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "2017"], ["ScaleNet: Guiding Object Proposal Generation in Supermarkets and Beyond", "", "Shanghai University", "Shanghai University", "\u4e0a\u6d77\u5927\u5b66, \u9526\u79cb\u8def, \u5927\u573a\u9547, \u5b9d\u5c71\u533a (Baoshan), \u4e0a\u6d77\u5e02, 201906, \u4e2d\u56fd", "31.32235655", "121.38400941", "edu", "", "2017"], ["Auto-DeepLab: Hierarchical Neural Architecture Search for Semantic Image Segmentation", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2019"], ["Image Caption with Endogenous\u2013Exogenous Attention", "School of Electronic and Information Engineering, Sun Yat-sen University, Guangzhou, China", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "2019"], ["Identity-Aware Textual-Visual Matching with Latent Co-attention", "", "Chinese University of Hong Kong", "The Chinese University of Hong Kong", "\u4e2d\u5927 CUHK, NA\u68af New Asia Stairs, \u99ac\u6599\u6c34 Ma Liu Shui, \u4e5d\u809a\u6751 Kau To Village, \u6c99\u7530\u5340 Sha Tin District, \u65b0\u754c New Territories, HK, DD193 1191, \u4e2d\u56fd", "22.42031295", "114.20788644", "edu", "", "2017"], ["Multi-label image classification with recurrently learning semantic dependencies", "School of Computer and Information, Hefei University of Technology, Hefei, China", "Hefei University of Technology", "Hefei University of Technology", "\u5408\u80a5\u5de5\u4e1a\u5927\u5b66\uff08\u5c6f\u6eaa\u8def\u6821\u533a\uff09, 193\u53f7, \u5357\u4e00\u73af\u8def, \u822a\u8fd0\u5357\u6751, \u5305\u516c\u8857\u9053, \u5408\u80a5\u5e02\u533a, \u5408\u80a5\u5e02, \u5b89\u5fbd\u7701, 230009, \u4e2d\u56fd", "31.84691800", "117.29053367", "edu", "", "2018"], ["Can You See the (Linguistic) Difference? Exploring Mass/Count Distinction in Vision", "", "University of Padova", "University of Padova", "Via Giovanni Gradenigo, 6, 35131 Padova PD, Italy", "45.40811720", "11.89437860", "edu", "University of Padova, Via Gradenigo, 6 - 35131- Padova, Italy", "2017"], ["Dropout during inference as a model for neurological degeneration in an image captioning network", "", "University of Toronto", "University of Toronto", "University of Toronto, St. George Street, Bloor Street Culture Corridor, Old Toronto, Toronto, Ontario, M5S 1A5, Canada", "43.66333345", "-79.39769975", "edu", "", "2018"], ["Weakly-Supervised Visual Grounding of Phrases with Linguistic Structures", "", "University of California, Davis", "University of California, Davis", "University of California, Davis, Apiary Drive, Yolo County, California, 95616-5270, USA", "38.53363490", "-121.79077264", "edu", "", "2017"], ["Deep Multimodal Learning: An Effective Method for Video Classification", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2018"], ["Predicting Motivations of Actions by Leveraging Text", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "2016"], ["Decoupled Classification Refinement: Hard False Positive Suppression for Object Detection", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2018"], ["Cross-media Multi-level Alignment with Relation Attention Network", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "2018"], ["Non-parametric human segmentation using support vector machine", "Yonsei University, Seoul 03722, South Korea", "Yonsei University", "Yonsei University", "\uc5f0\uc138\ub300, \uc5f0\uc138\ub85c, \uc2e0\ucd0c\ub3d9, \ucc3d\ucc9c\ub3d9, \uc11c\ub300\ubb38\uad6c, \uc11c\uc6b8\ud2b9\ubcc4\uc2dc, 03789, \ub300\ud55c\ubbfc\uad6d", "37.56004060", "126.93692480", "edu", "", "2016"], ["Multispectral Pedestrian Detection via Simultaneous Detection and Segmentation", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Toward Efficient Simultaneous Detection and Segmentation", "Peking University, National Engineering Laboratory for Video Technology, School of EE&CS, Beijing, China", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "2018"], ["Spatially Adaptive Computation Time for Residual Networks", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["Pre-gen Metrics: Predicting Caption Quality Metrics Without Generating Captions", "University of Malta, Msida, Malta", "University of Malta", "University of Malta", "University of Malta, Ring Road, Japanese Garden, L-Imsida, Malta, MSD 9027, Malta", "35.90232260", "14.48341890", "edu", "", "2018"], ["Deep Recurrent Convolutional Neural Network: Improving Performance For Speech Recognition", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2016"], ["Learning to Evaluate Image Captioning", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "2018"], ["Style Transfer at 100+ FPS Via Sub-Pixel Super-Resolution", "South China University of Technology", "South China University of Technology", "South China University of Technology", "\u534e\u5357\u7406\u5de5\u5927\u5b66, \u5927\u5b66\u57ce\u4e2d\u73af\u4e1c\u8def, \u5e7f\u5dde\u5927\u5b66\u57ce, \u65b0\u9020, \u756a\u79ba\u533a (Panyu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510006, \u4e2d\u56fd", "23.05020420", "113.39880323", "edu", "", "2018"], ["Language Models for Image Captioning: The Quirks and What Works", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2015"], ["Automatic Dataset Augmentation", "", "Harbin Institute of Technology", "Harbin Institute of Technology", "\u54c8\u5c14\u6ee8\u5de5\u4e1a\u5927\u5b66, \u53f8\u4ee4\u8857, \u5357\u5c97\u533a, \u54c8\u5c14\u6ee8\u5e02 / Harbin, \u9ed1\u9f99\u6c5f\u7701, 150000, \u4e2d\u56fd", "45.74139210", "126.62552755", "edu", "", "2017"], ["The Helping Hand: An Assistive Manipulation Framework Using Augmented Reality and Tongue-Drive Interfaces", "Institute for Robotics and Intelligent Machines, Georgia Institute of Technology, GA, USA", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2018"], ["Consistent Optimization for Single-Shot Object Detection", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2019"], ["Object Proposal Generation With Fully Convolutional Networks", "Keio-National University of Singapore (NUS) Connective Ubiquitous Technology for Embodiments Center, Interactive and Digital Media Institute, NUS, Singapore", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "2018"], ["Revisiting Graph Construction for Fast Image Segmentation", "", "Xiamen University", "Xiamen University", "\u53a6\u95e8\u5927\u5b66, \u601d\u660e\u5357\u8def Siming South Road, \u601d\u660e\u533a, \u601d\u660e\u533a (Siming), \u53a6\u95e8\u5e02 / Xiamen, \u798f\u5efa\u7701, 361005, \u4e2d\u56fd", "24.43994190", "118.09301781", "edu", "", "2018"], ["Large-Scale Sparse Learning From Noisy Tags for Semantic Segmentation", "Key Laboratory of Machine Perception, School of Electronics Engineering and Computer Science, Peking University, Beijing, China", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "2016"], ["Detection of valuable left-behind items in vehicle cabins", "Visual Information Lab, University of Bristol, UK", "University of Bristol", "University of Bristol", "Victoria Rooms, Whiteladies Road, Cliftonwood, Spike Island, Bristol, City of Bristol, South West England, England, BS8 2PY, UK", "51.45848370", "-2.60977520", "edu", "", "2017"], ["Automatic Generation of Grounded Visual Questions", "", "Tianjin University", "Tianjin University", "\u6cf0\u5c71\u822a\u7a7a\u6e2f/\u5929\u6d25\u5927\u53a6, \u67a3\u884c\u8def, \u67a3\u884c \u9ad8\u738b\u5bfa, \u957f\u57ce\u8def, \u5927\u6cb3, \u5cb1\u5cb3\u533a (Daiyue), \u6cf0\u5b89\u5e02, \u5c71\u4e1c\u7701, 271000, \u4e2d\u56fd", "36.20304395", "117.05842113", "edu", "", "2017"], ["Multi-Networks Joint Learning for Large-Scale Cross-Modal Retrieval", "University of Texas at San Antonio, San Antonio, TX, USA", "University of Texas at San Antonio", "University of Texas at San Antonio", "UTSA, Paseo Principal, San Antonio, Bexar County, Texas, 78249-1620, USA", "29.58333105", "-98.61944505", "edu", "", "2017"], ["Learning to Classify Fine-Grained Categories with Privileged Visual-Semantic Misalignment", "Institute of Automation, CAS Center for Excellence in Brain Science and Intelligence Technology, Chinese Academy of Sciences, Beijing, P.R. China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "2017"], ["Learning a Recurrent Visual Representation for Image Caption Generation", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2014"], ["Intelligent surveillance system for abandoned luggage", "Elektrik - Elektronik M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Orta Do\u011fu Teknik \u00dcniversitesi, Kuzey K\u0131br\u0131s Kamp\u00fcs\u00fc, Kalkanl\u0131, Kuzey K\u0131br\u0131s", "Bilgisayar M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Orta Do\u011fu Teknik \u00dcniversitesi, Kuzey K\u0131br\u0131s Kamp\u00fcs\u00fc, Kalkanl\u0131, Kuzey K\u0131br\u0131s", "Bilgisayar M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Orta Do\u011fu Teknik \u00dcniversitesi, Kuzey K\u0131br\u0131s Kamp\u00fcs\u00fc, Kalkanl\u0131, Kuzey K\u0131br\u0131s", "Kalkanl\u0131, G\u00fczelyurt", "35.24908700", "33.02407600", "edu", "", "2018"], ["Exploring Visual Relationship for Image Captioning", "", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "2018"], ["Learning Transferrable Knowledge for Semantic Segmentation with Deep Convolutional Neural Network", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "2016"], ["ESPNet: Efficient Spatial Pyramid of Dilated Convolutions for Semantic Segmentation", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "2018"], ["A Multi-Layer Approach to Superpixel-based Higher-order Conditional Random Field for Semantic Image Segmentation", "", "University of Texas at Arlington", "University of Texas at Arlington", "University of Texas at Arlington, South Nedderman Drive, Arlington, Tarrant County, Texas, 76010, USA", "32.72836830", "-97.11201835", "edu", "", "2018"], ["Scene Image Synthesis from Natural Sentences Using Hierarchical Syntactic Analysis", "The University of Tokyo, Tokyo, Japan", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "2016"], ["A Mask Regional Convolutional Neural Network Model for Segmenting Real Time Traffic Images", "Department of Electronics and Communication Engineering, Malaviya National Institute of Technology, Jaipur, Rajasthan, 302017, India", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2018"], ["Terahertz Image Detection with the Improved Faster Region-Based Convolutional Neural Network", "", "Xidian University", "Xidian University", "Xidian University (New Campus), 266\u53f7, \u94f6\u674f\u5927\u9053, \u5357\u96f7\u6751, \u957f\u5b89\u533a (Chang'an), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710126, \u4e2d\u56fd", "34.12358250", "108.83546000", "edu", "", "2018"], ["Image Classification using Transfer Learning from Siamese Networks based on Text Metadata Similarity", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2016"], ["BubbleView: an alternative to eye-tracking for crowdsourcing image importance", "", "MIT CSAIL", "MIT CSAIL", "32 Vassar St, Cambridge, MA 02139, USA", "42.36194070", "-71.09043780", "edu", "", "2017"], ["Benchmarking and Error Diagnosis in Multi-instance Pose Estimation", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "2017"], ["Meta Networks for Neural Style Transfer", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "2017"], ["Revisiting Unreasonable Effectiveness of Data in Deep Learning Era", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["Semantic Amodal Segmentation", "", "Rutgers University", "Rutgers University", "Rutgers Cook Campus - North, Biel Road, New Brunswick, Middlesex County, New Jersey, 08901, USA", "40.47913175", "-74.43168868", "edu", "", "2017"], ["Deep Feature Pyramid Reconfiguration for Object Detection", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2018"], ["Person Search via a Mask-Guided Two-Stream CNN Model", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "2018"], ["Employing Weak Annotations for Medical Image Analysis Problems", "", "Nagoya University", "Nagoya University", "SuperDARN (Hokkaido West), \u592a\u8f9b\u7b2c1\u652f\u7dda\u6797\u9053, \u9678\u5225\u753a, \u8db3\u5bc4\u90e1, \u5341\u52dd\u7dcf\u5408\u632f\u8208\u5c40, \u5317\u6d77\u9053, \u5317\u6d77\u9053\u5730\u65b9, \u65e5\u672c", "43.53750985", "143.60768225", "edu", "", "2017"], ["Watching the TV Watchers", "Georgia Institute of Technology, Center for Behavioral Imaging and School of Electrical and Computer Engineering, Atlanta, GA, USA", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2018"], ["Deep Priority Hashing", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2018"], ["Single-Shot Bidirectional Pyramid Networks for High-Quality Object Detection", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Neighbourhood Watch: Referring Expression Comprehension via Language-guided Graph Attention Networks", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2018"], ["Parallel Attention: A Unified Framework for Visual Object Discovery Through Dialogs and Queries", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2018"], ["Learning Instance-Aware Object Detection Using Determinantal Point Processes", "", "Seoul National University", "Seoul National University", "\uc11c\uc6b8\ub300\ud559\uad50, \uc11c\ud638\ub3d9\ub85c, \uc11c\ub454\ub3d9, \uad8c\uc120\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16614, \ub300\ud55c\ubbfc\uad6d", "37.26728000", "126.98411510", "edu", "", "2018"], ["Maximum Classifier Discrepancy for Unsupervised Domain Adaptation", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "2018"], ["Multi-oriented Scene Text Detection via Corner Localization and Region Segmentation", "", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "2018"], ["Efficient Video Object Segmentation via Network Modulation", "", "Northwestern University", "Northwestern University", "Northwestern University, Northwestern Place, Downtown, Evanston, Cook County, Illinois, 60208, USA", "42.05511640", "-87.67581113", "edu", "", "2018"], ["Strong-Weak Distribution Alignment for Adaptive Object Detection.", "", "Boston University", "Boston University", "BU, Bay State Road, Fenway, Boston, Suffolk County, Massachusetts, 02215, USA", "42.35042530", "-71.10056114", "edu", "", "2018"], ["Revisiting Dilated Convolution: A Simple Approach for Weakly- and Semi-Supervised Semantic Segmentation", "", "IBM Thomas J. Watson Research Center", "IBM Thomas J. Watson Research Center", "IBM Yorktown research lab, Adams Road, Millwood, Town of New Castle, Westchester County, New York, 10562, USA", "41.21002475", "-73.80407056", "company", "", "2018"], ["Detecting Sex From Handwritten Examples", "Fab Lab, Independent University Bangladesh, Dhaka, Bangladesh", "Independent University Bangladesh", "Fab Lab, Independent University Bangladesh, Dhaka, Bangladesh", "Independent University, Bangladesh Plot 16, \u0986\u09ab\u09a4\u09be\u09ac \u0989\u09a6\u09cd\u09a6\u09bf\u09a8 \u0986\u09b9\u09ae\u09c7\u09a6 \u09b0\u09cb\u09a1, \u09a2\u09be\u0995\u09be, Bangladesh", "23.81524690", "90.42796720", "edu", "", "2018"], ["Zero-Shot Object Detection: Learning to Simultaneously Recognize and Localize Novel Concepts", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "2018"], ["Training CNNs from Synthetic Data for Part Handling in Industrial Environments", "Mercedes-Benz-Cars Daimler AG, Stuttgart, Germany", "BTU Cottbus-Senftenberg, Chair of Automation Technology, Cottbus, Germany", "BTU Cottbus-Senftenberg, Chair of Automation Technology, Cottbus, Germany", "Platz der Deutschen Einheit 1, 03046 Cottbus, Germany", "51.76698700", "14.32695000", "edu", "", "2018"], ["Query : \" A man in a red sweatshirt performing breakdance \"", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2018"], ["Semantic segmentation based on iterative contraction and merging", "National Chiao Tung University, Hsinchu, Taiwan", "National Chiao Tung University", "National Chiao Tung University", "NCTU;\u4ea4\u5927;\u4ea4\u901a\u5927\u5b78;\u4ea4\u5927\u5149\u5fa9\u6821\u5340;\u4ea4\u901a\u5927\u5b78\u5149\u5fa9\u6821\u5340, 1001, \u5927\u5b78\u8def, \u5149\u660e\u91cc, \u8d64\u571f\u5d0e, \u6771\u5340, \u65b0\u7af9\u5e02, 30010, \u81fa\u7063", "24.78676765", "120.99724412", "edu", "", "2017"], ["Image captioning using deep neural architectures", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2017"], ["Training Constrained Deconvolutional Networks for Road Scene Semantic Segmentation", "", "Cambridge University", "Cambridge University", "University, Cambridge Road, Old Portsmouth, Portsmouth, South East, England, PO1 2HB, UK", "50.79440260", "-1.09717480", "edu", "", "2016"], ["A sequential guiding network with attention for image captioning", "", "North China Electric Power University", "North China Electric Power University", "\u534e\u5317\u7535\u529b\u5927\u5b66, \u6c38\u534e\u5317\u5927\u8857, \u83b2\u6c60\u533a, \u4fdd\u5b9a\u5e02, \u83b2\u6c60\u533a (Lianchi), \u4fdd\u5b9a\u5e02, \u6cb3\u5317\u7701, 071000, \u4e2d\u56fd", "38.87604460", "115.49738730", "edu", "", "2018"], ["Driver Pose Estimation by Hybrid Convolutional Network Architecture", "National Engineering Laboratory for Visual Information Processing and Applications, Xi'an, Shaanxi, 710049, China", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Discriminative Learning of Open-Vocabulary Object Retrieval and Localization by Negative Phrase Augmentation", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "2018"], ["A Vision-based Transfer Learning Approach for Recognizing Behavioral Symptoms in People with Dementia", "", "Edge Hill University", "Edge Hill University", "Edge Hill University, St Helens Road, West Lancashire, Lancs, North West England, England, L39 4QP, UK", "53.55821550", "-2.86904651", "edu", "", "2018"], ["Self-supervised Learning of Motion Capture", "", "University of Pittsburgh", "University of Pittsburgh", "University of Pittsburgh, Sutherland Drive, West Oakland, PGH, Allegheny County, Pennsylvania, 15240, USA", "40.44415295", "-79.96243993", "edu", "", "2017"], ["Visual Dialog", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2017"], ["Chat-crowd: A Dialog-based Platform for Visual Layout Composition", "", "University of Virginia", "University of Virginia", "University of Virginia, Rotunda Alley, Carr's Hill, Albemarle County, Virginia, 22904-4119, USA", "38.03536820", "-78.50353220", "edu", "", "2018"], ["VISER: Visual Self-Regularization", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "2018"], ["BoxSup: Exploiting Bounding Boxes to Supervise Convolutional Networks for Semantic Segmentation", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2015"], ["Visual Referring Expression Recognition: What Do Systems Actually Learn?", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Auto-Encoding Scene Graphs for Image Captioning", "", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "2018"], ["Dense Image Representation with Spatial Pyramid VLAD Coding of CNN for Locally Robust Captioning", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "2016"], ["G-Distillation: Reducing Overconfident Errors on Novel Samples", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2018"], ["Proposal Incorporating Structural Bias into Neural Networks", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["Image Captioning with an Intermediate Attributes Layer", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2015"], ["Weakly Supervised Attention Learning for Textual Phrases Grounding", "", "University of California, Irvine", "University of California, Irvine", "University of California, Irvine, East Peltason Drive, Turtle Rock, Irvine, Orange County, California, 92612, USA", "33.64319010", "-117.84016494", "edu", "", "2018"], ["Identifying Most Walkable Direction for Navigation in an Outdoor Environment", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "2017"], ["WebVision Database: Visual Learning and Understanding from Web Data", "", "ETH Zurich", "Computer Vision Laboratory, ETH Zurich, Zurich, Switzerland", "Sternwartstrasse 7, 8092 Z\u00fcrich, Switzerland", "47.37723980", "8.55216180", "edu", "", "2017"], ["Pose Flow: Efficient Online Pose Tracking", "", "Shanghai, China", "Shanghai, China", "Shanghai, China", "31.23039040", "121.47370210", "edu", "", "2018"], ["MetaAnchor: Learning to Detect Objects with Customized Anchors", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "2018"], ["Image Description using Deep Neural Networks", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "2016"], ["Combining Weakly and Webly Supervised Learning for Classifying Food Images", "", "SRI International", "SRI International", "SRI International Building, West 1st Street, Menlo Park, San Mateo County, California, 94025, USA", "37.45857960", "-122.17560525", "edu", "", "2017"], ["Measuring and Modifying the Intrinsic Memorability of Images", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "2015"], ["SSP: Supervised Sparse Projections for Large-Scale Retrieval in High Dimensions", "", "University of British Columbia", "University of British Columbia", "University of British Columbia, Eagles Drive, Hawthorn Place, University Endowment Lands, Metro Vancouver, British Columbia, V6T, Canada", "49.25839375", "-123.24658161", "edu", "", "2016"], ["Semantic Video Segmentation by Gated Recurrent Flow Propagation", "", "Lund University", "Lund University", "TEM at Lund University, 9, Klostergatan, Stadsk\u00e4rnan, Centrum, Lund, Sk\u00e5ne, G\u00f6taland, 22222, Sverige", "55.70395710", "13.19020110", "edu", "", "2016"], ["Maya Codical Glyph Segmentation: A Crowdsourcing Approach", "Idiap Research Institute, and the School of Electrical Engineering, Swiss Federal Institute of Technology in Lausanne (EPFL), Martigny, Switzerland", "IDIAP Research Institute", "IDIAP Research Institute", "Idiap Research Institute, Parking Centre du parc, Martigny, Valais/Wallis, 1920, Schweiz/Suisse/Svizzera/Svizra", "46.10923700", "7.08453549", "edu", "", "2018"], ["Deep Learning for Classification of Colorectal Polyps on Whole-slide Images", "", "Dartmouth College", "Dartmouth College", "Dartmouth College, Tuck Mall, Hanover, Grafton County, New Hampshire, 03755, USA", "43.70479270", "-72.29259090", "edu", "", "2017"], ["Survey on the attention based RNN model and its applications in computer vision", "", "Delft University of Technology", "Delft University of Technology", "TU Delft, Mekelweg, TU-wijk, Delft, Zuid-Holland, Nederland, 2628, Nederland", "51.99882735", "4.37396037", "edu", "", "2016"], ["Scalable, High-Quality Object Detection", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "2014"], ["An Integral Pose Regression System for the ECCV2018 PoseTrack Challenge", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "2018"], ["ON GENERIC OBJECT RECOGNITION TECHNIQUES : CHALLENGES AND OPPORTUNITIES Prof", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", ""], ["Joint Flow: Temporal Flow Fields for Multi Person Tracking", "", "University of Bonn", "University of Bonn", "Rheinische Friedrich-Wilhelms-Universit\u00e4t Bonn, Arkadenhof, Bonn-Zentrum, Stadtbezirk Bonn, Bonn, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 53113, Deutschland", "50.73381240", "7.10224650", "edu", "", "2018"], ["Snuba: Automating Weak Supervision to Label Training Data", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2018"], ["A 2 A : Attention to Attention Reasoning for Movie Question Answering", "", "Institute of Information Science", "Institute of Information Science", "\u8cc7\u8a0a\u79d1\u5b78\u7814\u7a76\u6240, \u6578\u7406\u5927\u9053, \u4e2d\u7814\u91cc, \u5357\u6e2f\u5b50, \u5357\u6e2f\u5340, \u81fa\u5317\u5e02, 11574, \u81fa\u7063", "25.04107280", "121.61475620", "edu", "", "2018"], ["Anchor Box Optimization for Object Detection", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2018"], ["Taskonomy: Disentangling Task Transfer Learning", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2018"], ["Multi-scale Location-Aware Kernel Representation for Object Detection", "", "Dalian University of Technology", "Dalian University of Technology", "\u5927\u8fde\u7406\u5de5\u5927\u5b66, \u7ea2\u51cc\u8def, \u7518\u4e95\u5b50\u533a, \u51cc\u6c34\u9547, \u7518\u4e95\u5b50\u533a / Ganjingzi, \u5927\u8fde\u5e02 / Dalian, \u8fbd\u5b81\u7701, 116023, \u4e2d\u56fd", "38.88140235", "121.52281098", "edu", "", "2018"], ["Jointly Discovering Visual Objects and Spoken Words from Raw Sensory Input", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "2018"], ["Who Are Raising Their Hands ? Hand-Raiser Seeking Based on Object Detection and Pose Estimation", "", "Shanghai Jiao Tong University", "Shanghai Jiao Tong University", "\u4e0a\u6d77\u4ea4\u901a\u5927\u5b66\uff08\u5f90\u6c47\u6821\u533a\uff09, \u6dee\u6d77\u897f\u8def, \u756a\u79ba\u5c0f\u533a, \u5e73\u9634\u6865, \u5f90\u6c47\u533a, \u4e0a\u6d77\u5e02, 200052, \u4e2d\u56fd", "31.20081505", "121.42840681", "edu", "", "2018"], ["Robust Adversarial Perturbation on Deep Proposal-based Models", "", "GE Global Research Center", "GE Global Research Center", "GE Global Research Center, Aqueduct, Niskayuna, Schenectady County, New York, USA", "42.82982480", "-73.87719385", "edu", "", "2018"], ["Grounded Objects and Interactions for Video Captioning", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2017"], ["Neural Style Transfer: A Review", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2017"], ["Priming Neural Networks", "", "York University", "York University", "York University, Keele Campus, Campus Walk, North York, Toronto, Ontario, M3J 2S5, Canada", "43.77439110", "-79.50481085", "edu", "", "2018"], ["Neural Baby Talk", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2018"], ["End-to-End Recovery of Human Shape and Pose", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2018"], ["HashNet: Deep Learning to Hash by Continuation", "", "University of Illinois at Chicago", "University of Illinois at Chicago", "University of Illinois at Chicago, West Taylor Street, Greektown, Chicago, Cook County, Illinois, 60607, USA", "41.86898915", "-87.64856256", "edu", "", "2017"], ["Associative Embedding: End-to-End Learning for Joint Detection and Grouping", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "2017"], ["Towards Deep Cellular Phenotyping in Placental Histology", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2018"], ["People and Vehicles in Danger - A Fire and Flood Detection System in Social Media", "CERTH-ITI, Thessaloniki, Greece", "CERTH-ITI, Thessaloniki, Greece", "CERTH-ITI, Thessaloniki, Greece", "Thermi 570 01, Greece", "40.56676110", "22.99801470", "edu", "", "2018"], ["Channel Pruning for Accelerating Very Deep Neural Networks", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2017"], ["Personalized Serious Games for Cognitive Intervention with Lifelog Visual Analytics", "Singapore Bioimaging Consortium, A*STAR, Singapore, Singapore", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "2018"], ["From UI Design Image to GUI Skeleton: A Neural Machine Translator to Bootstrap Mobile GUI Implementation", "Nanyang Technological University, Singapore", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "2018"], ["Selective Refinement Network for High Performance Face Detection", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2018"], ["Describing Common Human Visual Actions in Images", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "2015"], ["Person Retrieval in Surveillance Video using Height, Color and Gender", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2018"], ["A Robot Localization Framework Using CNNs for Object Detection and Pose Estimation", "", "Otto von Guericke University", "Otto von Guericke University", "Otto-von-Guericke-Universit\u00e4t Magdeburg, 2, Universit\u00e4tsplatz, Kr\u00f6kentorviertel/Breiter Weg NA, Alte Neustadt, Magdeburg, Sachsen-Anhalt, 39106, Deutschland", "52.14005065", "11.64471248", "edu", "", "2018"], ["Automatic Concept Discovery from Parallel Text and Visual Corpora", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2015"], ["Image Captioning With Visual-Semantic Double Attention", "School of Electronics and Information Technology, Sun Yat-Sen University, Guangdong, People's Republic of China", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "2019"], ["Understanding Fake Faces", "", "Waseda University", "Waseda University", "\u65e9\u7a32\u7530\u5927\u5b66 \u5317\u4e5d\u5dde\u30ad\u30e3\u30f3\u30d1\u30b9, 2-2, \u6709\u6bdb\u5f15\u91ce\u7dda, \u516b\u5e61\u897f\u533a, \u5317\u4e5d\u5dde\u5e02, \u798f\u5ca1\u770c, \u4e5d\u5dde\u5730\u65b9, 808-0135, \u65e5\u672c", "33.88987280", "130.70856205", "edu", "", "2018"], ["SketchyScene: Richly-Annotated Scene Sketches", "", "Simon Fraser University", "Simon Fraser University", "SFU Burnaby, South Campus Road, Barnet, Burnaby, Metro Vancouver, British Columbia, V5A 4X6, Canada", "49.27674540", "-122.91777375", "edu", "", "2018"], ["Much Ado About Time: Exhaustive Annotation of Temporal Data", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2016"], ["Mainstream: Dynamic Stem-Sharing for Multi-Tenant Video Processing", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["A Multi-Oriented Scene Text Detector with Position-Sensitive Segmentation", "University of Chinese Academy of Sciences, Beijing, China", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2018"], ["Simple Baselines for Human Pose Estimation and Tracking", "", "University of Electronic Science and Technology of China", "University of Electronic Science and Technology of China", "Columbus, OH 43210, USA", "40.01419050", "-83.03091430", "edu", "", "2018"], ["Image describing based on bidirectional LSTM and improved sequence sampling", "College of Computer Science. Chongqing University, Chongqing, China", "College of Computer Science. Chongqing University", "College of Computer Science. Chongqing University, Chongqing, China", "China, Chongqing Shi, Shapingba Qu, ChongQing DaXue, \u6c99\u6b63\u8857174\u53f7", "29.56488000", "106.46809700", "edu", "", "2017"], ["Image Inspired Poetry Generation in XiaoIce", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2018"], ["Deep conditional neural network for image segmentation", "Department of Computing, The Hong Kong Polytechnic University", "Hong Kong Polytechnic University", "Hong Kong Polytechnic University", "hong kong, 11, \u80b2\u624d\u9053 Yuk Choi Road, \u5c16\u6c99\u5480 Tsim Sha Tsui, \u6cb9\u5c16\u65fa\u5340 Yau Tsim Mong District, \u4e5d\u9f8d Kowloon, HK, 00000, \u4e2d\u56fd", "22.30457200", "114.17976285", "edu", "", "2016"], ["Human Centred Object Co-Segmentation", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2016"], ["Image Captioning with both Object and Scene Information", "Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "2016"], ["SuperNeurons: FFT-based Gradient Sparsification in the Distributed Training of Deep Neural Networks", "", "Brown University", "Brown University", "Brown University, Waterman Street, College Hill, Providence, Bristol, Rhode Island, 02912, USA", "41.82686820", "-71.40123146", "edu", "", "2018"], ["Improving Image Captioning with Conditional Generative Adversarial Nets", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["A Data Driven Approach for Compound Figure Separation Using Convolutional Neural Networks", "", "Indiana University", "Indiana University", "Indiana University East, West Cart Road, Richmond, Wayne County, Indiana, 47374, USA", "39.86948105", "-84.87956905", "edu", "", "2017"], ["Intention Oriented Image Captions with Guiding Objects", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2018"], ["Aligning Books and Movies: Towards Story-Like Visual Explanations by Watching Movies and Reading Books", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "2015"], ["Multi-scale Patch Aggregation (MPA) for Simultaneous Detection and Segmentation", "", "Chinese University of Hong Kong", "The Chinese University of Hong Kong", "\u4e2d\u5927 CUHK, NA\u68af New Asia Stairs, \u99ac\u6599\u6c34 Ma Liu Shui, \u4e5d\u809a\u6751 Kau To Village, \u6c99\u7530\u5340 Sha Tin District, \u65b0\u754c New Territories, HK, DD193 1191, \u4e2d\u56fd", "22.42031295", "114.20788644", "edu", "", "2016"], ["Interpretable Explanations of Black Boxes by Meaningful Perturbation", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2017"], ["A Restricted Visual Turing Test for Deep Scene and Event Understanding", "", "UCLA", "University of California, Los Angeles", "Los Angeles, CA 90095, USA", "34.06892100", "-118.44518110", "edu", "", "2015"], ["Euphrates: Algorithm-SoC Co-Design for Low-Power Mobile Continuous Vision", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2018"], ["Similarity Reasoning over Semantic Context\u2013graphs", "", "Brown University", "Brown University", "Brown University, Waterman Street, College Hill, Providence, Bristol, Rhode Island, 02912, USA", "41.82686820", "-71.40123146", "edu", "", "2015"], ["Multimodal Differential Network for Visual Question Generation", "", "Indian Institute of Technology Delhi", "IIIT-Delhi, India", "IIIT-Delhi, Mathura Road, Friends Colony, South East Delhi, Delhi, 110020, India", "28.54632595", "77.27325504", "edu", "", "2018"], ["Learning Spatial Regularization with Image-Level Supervisions for Multi-label Image Classification", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "2017"], ["Visual Question Reasoning on General Dependency Tree", "", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "2018"], ["Interactive Demonstration of Probabilistic Predicates", "University of Washington &Microsoft, Seattle, WA, USA", "Microsoft, Redmond, WA, USA", "Microsoft, Redmond, WA, USA", "5000 148th Ave NE, Redmond, WA 98052, USA", "47.65292200", "-122.14223560", "edu", "", "2018"], ["A Dataset and Exploration of Models for Understanding Video Data through Fill-in-the-Blank Question-Answering", "", "Polytechnique Montreal", "Polytechnique Montr\u00b4eal", "2900 Boulevard Edouard-Montpetit, Montr\u00e9al, QC H3T 1J4, Canada", "45.50438400", "-73.61288290", "edu", "Polytechnique Montreal, Montreal, Quebec, Canada", "2017"], ["Are You Talking to Me? Reasoned Visual Dialog Generation Through Adversarial Learning", "", "Northwestern Polytechnical University", "Northwestern Polytechnical University", "\u897f\u5317\u5de5\u4e1a\u5927\u5b66 \u53cb\u8c0a\u6821\u533a, 127\u53f7, \u53cb\u8c0a\u897f\u8def, \u957f\u5b89\u8def, \u7891\u6797\u533a (Beilin), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710072, \u4e2d\u56fd", "34.24691520", "108.91061982", "edu", "", "2018"], ["MovieQA: Understanding Stories in Movies through Question-Answering", "", "Karlsruhe Institute of Technology", "Karlsruhe Institute of Technology", "KIT, Leopoldshafener Allee, Linkenheim, Linkenheim-Hochstetten, Landkreis Karlsruhe, Regierungsbezirk Karlsruhe, Baden-W\u00fcrttemberg, 76351, Deutschland", "49.10184375", "8.43312560", "edu", "", "2016"], ["ReDMark: Framework for Residual Diffusion Watermarking on Deep Networks", "", "University of Queensland", "University of Queensland", "University of Queensland, University Drive, Hill End, St Lucia, Brisbane, QLD, 4072, Australia", "-27.49741805", "153.01316956", "edu", "", "2018"], ["Transitive Invariance for Self-Supervised Visual Representation Learning", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["LabelBank: Revisiting Global Perspectives for Semantic Segmentation", "", "Simon Fraser University", "Simon Fraser University", "SFU Burnaby, South Campus Road, Barnet, Burnaby, Metro Vancouver, British Columbia, V5A 4X6, Canada", "49.27674540", "-122.91777375", "edu", "", "2017"], ["Application of a Hybrid Model Based on a Convolutional Auto-Encoder and Convolutional Neural Network in Object-Oriented Remote Sensing Classification", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "2018"], ["Visual Storytelling", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2016"], ["Boundary aware image segmentation with unsupervised mixture models", "Image Analysis Group, Technical University Dortmund, Otto-Hahn-Str. 4, 44227 Dortmund, Germany", "Technical University Dortmund", "Image Analysis Group, Technical University Dortmund, Otto-Hahn-Str. 4, 44227 Dortmund, Germany", "Emil-Figge-Stra\u00dfe 50, 44227 Dortmund, Germany", "51.49219020", "7.41413620", "edu", "", "2017"], ["Edge-Cloud Collaborative Processing for Intelligent Internet of Things: A Case Study on Smart Surveillance", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2018"], ["Uncovering the Temporal Context for Video Question Answering", "SCS, Carnegie Mellon University, Pittsburgh, USA", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["Inside-Outside Net: Detecting Objects in Context with Skip Pooling and Recurrent Neural Networks", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "2016"], ["Deep learning-based human head detection and extraction for robotic portrait drawing", "Shenzhen Academy of Robotics, Shenzhen, Guangdong, China", "Shenzhen Academy of Robotics, Shenzhen, Guangdong, China", "Shenzhen Academy of Robotics, Shenzhen, Guangdong, China", "Shenzhen, Guangdong, China", "22.54309600", "114.05786500", "edu", "", "2017"], ["CBVMR: Content-Based Video-Music Retrieval Using Soft Intra-Modal Structure Constraint", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2018"], ["On the Origin of Deep Learning On the Origin of Deep Learning", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["A survey on deep neural network-based image captioning", "School of Mechanical, Electrical and Information Engineering, Shandong University, Weihai, People\u2019s Republic of China", "Shandong University", "Shandong University", "\u5c71\u4e1c\u5927\u5b66, \u6cf0\u5b89\u8857, \u9ccc\u5c71\u536b\u8857\u9053, \u5373\u58a8\u533a, \u9752\u5c9b\u5e02, \u5c71\u4e1c\u7701, 266200, \u4e2d\u56fd", "36.36934730", "120.67381800", "edu", "", "2018"], ["An object based graph representation for video comparison", "Dept. of Electrical and Computer Engineering, NYU Tandon School of Engineering, New York, USA", "Chongqing University of Technology", "Chongqing University of Technology, China", "69 Hongguang Ave, Banan Qu, Chongqing Shi, China", "29.45832600", "106.52994700", "edu", "", "2017"], ["Phrase Localization and Visual Relationship Detection with Comprehensive Image-Language Cues", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2017"], ["Deep image representations using caption generators", "", "Indian Institute of Science Bangalore", "Indian Institute of Science Bangalore", "IISc, Gulmohar Marg, RMV Stage II - 1st Block, Aramane Nagara Ward, West Zone, Bengaluru, Bangalore Urban, Karnataka, 560012, India", "13.02223470", "77.56718325", "edu", "", "2017"], ["Convolution Neural Networks With Two Pathways for Image Style Recognition", "Institute for Interdisciplinary Information Sciences, Tsinghua University, Beijing, China", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2017"], ["Natural Language Object Retrieval", "", "University of Massachusetts", "University of Massachusetts", "University of Massachusetts, Hicks Way, Amherst, Hampshire, Massachusetts, 01003, USA", "42.38897850", "-72.52869870", "edu", "", "2016"], ["Watch and learn: Semi-supervised learning of object detectors from videos", "", "Robotics Institute", "Robotics Institute", "Institute for Field Robotics, \u0e1b\u0e23\u0e30\u0e0a\u0e32\u0e2d\u0e38\u0e17\u0e34\u0e28, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, \u0e40\u0e02\u0e15\u0e23\u0e32\u0e29\u0e0e\u0e23\u0e4c\u0e1a\u0e39\u0e23\u0e13\u0e30, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, 10140, \u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22", "13.65450525", "100.49423171", "edu", "", "2015"], ["Advanced Deep-Learning Techniques for Salient and Category-Specific Object Detection: A Survey", "Northwestern Polytechnical University, Xi'an, 710072, China", "Northwestern Polytechnical University", "Northwestern Polytechnical University", "\u897f\u5317\u5de5\u4e1a\u5927\u5b66 \u53cb\u8c0a\u6821\u533a, 127\u53f7, \u53cb\u8c0a\u897f\u8def, \u957f\u5b89\u8def, \u7891\u6797\u533a (Beilin), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710072, \u4e2d\u56fd", "34.24691520", "108.91061982", "edu", "", "2018"], ["Word Prior Detection Segmentation Input \" The left guy \" Image : Query : a guy left the youth Energy", "", "IBM Thomas J. Watson Research Center", "IBM Thomas J. Watson Research Center", "IBM Yorktown research lab, Adams Road, Millwood, Town of New Castle, Westchester County, New York, 10562, USA", "41.21002475", "-73.80407056", "company", "", "2017"], ["Image Caption with Synchronous Cross-Attention", "Beijing University of Posts and Telecommunications, Beijing, China", "Beijing University of Posts and Telecommunications", "Beijing University of Posts and Telecommunications", "\u5317\u4eac\u90ae\u7535\u5927\u5b66, \u897f\u571f\u57ce\u8def, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100082, \u4e2d\u56fd", "39.96014880", "116.35193921", "edu", "", "2017"], ["Exploring confusing scene classes for the places dataset: Insights and solutions", "Department of Electrical Engineering, University of Southern California, Los Angeles, CA 90089, U.S.A.", "University of Southern California", "University of Southern California", "University of Southern California, Watt Way, Saint James Park, LA, Los Angeles County, California, 90089, USA", "34.02241490", "-118.28634407", "edu", "", "2017"], ["Adversarial Ranking for Language Generation", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "2017"], ["3D-SSD: Learning Hierarchical Features from RGB-D Images for Amodal 3D Object Detection", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "2017"], ["DAC-SDC Low Power Object Detection Challenge for UAV Applications", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2018"], ["Neuron-level Selective Context Aggregation for Scene Segmentation", "", "Shandong University", "Shandong University", "\u5c71\u4e1c\u5927\u5b66, \u6cf0\u5b89\u8857, \u9ccc\u5c71\u536b\u8857\u9053, \u5373\u58a8\u533a, \u9752\u5c9b\u5e02, \u5c71\u4e1c\u7701, 266200, \u4e2d\u56fd", "36.36934730", "120.67381800", "edu", "", "2017"], ["Factors Influencing The Performance of Image Captioning Model: An Evaluation", "SoICT, HUST and School of Information and Communication Technology, Hanoi University of Science and Technology, Hanoi, Vietnam", "Hanoi University of Science and Technology", "Hanoi University of Science and Technology", "HUST, Tr\u1ea7n \u0110\u1ea1i Ngh\u0129a, Hai B\u00e0 Tr\u01b0ng, H\u00e0 N\u1ed9i, 10999, Vi\u1ec7t Nam", "21.00395200", "105.84360183", "edu", "", "2016"], ["Progressive Neural Architecture Search", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2018"], ["Beyond Domain Adaptation: Unseen Domain Encapsulation via Universal Non-volume Preserving Models", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2018"], ["Object-centric Auto-encoders and Dummy Anomalies for Abnormal Event Detection in Video", "", "Romania", "Romania", "Romania", "45.94316100", "24.96676000", "edu", "", "2018"], ["From Known to the Unknown: Transferring Knowledge to Answer Questions about Novel Visual and Semantic Concepts", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "2018"], ["Weakly Supervised Salient Object Detection Using Image Labels", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "2018"], ["Reducing Network Agnostophobia", "", "University of Colorado, Colorado Springs", "University of Colorado Colorado Springs", "Main Hall, The Spine, Colorado Springs, El Paso County, Colorado, 80907, USA", "38.89207560", "-104.79716389", "edu", "", "2018"], ["DistInit: Learning Video Representations without a Single Labeled Video", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2019"], ["Image2song: Song Retrieval via Bridging Image Content and Lyric Words", "", "Northwestern Polytechnical University", "Northwestern Polytechnical University", "\u897f\u5317\u5de5\u4e1a\u5927\u5b66 \u53cb\u8c0a\u6821\u533a, 127\u53f7, \u53cb\u8c0a\u897f\u8def, \u957f\u5b89\u8def, \u7891\u6797\u533a (Beilin), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710072, \u4e2d\u56fd", "34.24691520", "108.91061982", "edu", "", "2017"], ["An efficient framework for learning sentence representations", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "2018"], ["Semantic Correspondence: A Hierarchical Approach", "", "Queensland University of Technology", "Queensland University of Technology", "Queensland University of Technology, Macgregor Lane, Merthyr, South Brisbane, Brisbane, QLD, 4000, Australia", "-27.47715625", "153.02841004", "edu", "", "2018"], ["Contextual Memory Trees", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2018"], ["Adding object detection skills to visual dialogue agents", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "2018"], ["Generate, Segment and Replace: Towards Generic Manipulation Segmentation.", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "2018"], ["Self-view Grounding Given a Narrated 360{\\deg} Video", "", "Microsoft Research Asia", "Microsoft Live Labs Research, China", "China, Beijing Shi, Haidian Qu, Zhichun Rd, 49\u53f7\u5e0c\u683c\u739b709\u53f7 \u90ae\u653f\u7f16\u7801: 100080", "39.97721700", "116.33763200", "company", "", "2017"], ["Learning RoI Transformer for Detecting Oriented Objects in Aerial Images", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "2018"], ["Survey of Recent Advances in Visual Question Answering", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2017"], ["Richer Semantic Visual and Language Representation for Video Captioning", "Tongji University, Shanghai, China", "Tongji University", "Tongji University", "\u540c\u6d4e\u5927\u5b66, 1239, \u56db\u5e73\u8def, \u6c5f\u6e7e, \u8679\u53e3\u533a, \u4e0a\u6d77\u5e02, 200092, \u4e2d\u56fd", "31.28473925", "121.49694909", "edu", "", "2017"], ["Touchdown: Natural Language Navigation and Spatial Reasoning in Visual Street Environments", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "2018"], ["Visual attribute transfer through deep image analogy", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2017"], ["Towards Improved Design and Evaluation of Epileptic Seizure Predictors", "Mayo Systems Electrophysiology Laboratory, Departments of Neurology and Biomedical EngineeringMayo Clinic", "Machine Learning GroupTechnische Universität Berlin", "Machine Learning GroupTechnische Universität Berlin", "Berlin, Germany", "52.52000660", "13.40495400", "edu", "", "2018"], ["PReMVOS: Proposal-generation, Refinement and Merging for Video Object Segmentation", "", "RWTH Aachen University", "RWTH Aachen University", "RWTH Aachen, Mies-van-der-Rohe-Stra\u00dfe, K\u00f6nigsh\u00fcgel, Aachen-Mitte, Aachen, St\u00e4dteregion Aachen, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 52074, Deutschland", "50.77917030", "6.06728733", "edu", "", "2018"], ["Explicit Bias Discovery in Visual Question Answering Models", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "2018"], ["AUTOMATIC IMAGE ANNOTATION MODEL USING LSTM APPROACH", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2017"], ["Mo 2 Cap 2 : Real-time Mo bile 3 D Mo tion Cap ture with a Cap-mounted Fisheye Camera", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2018"], ["Stroke Controllable Fast Style Transfer with Adaptive Receptive Fields", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "2018"], ["Learning 3 D Scene Synthesis from Annotated RGB-D Images", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "2016"], ["Bottom-up Pose Estimation of Multiple Person with Bounding Box Constraint", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "2018"], ["Transferable Interactiveness Prior for Human-Object Interaction Detection", "", "Shanghai Jiao Tong University", "Shanghai Jiao Tong University", "\u4e0a\u6d77\u4ea4\u901a\u5927\u5b66\uff08\u5f90\u6c47\u6821\u533a\uff09, \u6dee\u6d77\u897f\u8def, \u756a\u79ba\u5c0f\u533a, \u5e73\u9634\u6865, \u5f90\u6c47\u533a, \u4e0a\u6d77\u5e02, 200052, \u4e2d\u56fd", "31.20081505", "121.42840681", "edu", "", "2018"], ["A Fully Convolutional Two-Stream Fusion Network for Interactive Image Segmentation", "", "Loughborough University", "Loughborough University", "Computer Science, University Road, Charnwood, Leicestershire, East Midlands, England, LE11 3TP, UK", "52.76635770", "-1.22924610", "edu", "", "2019"], ["Corpus Construction and Semantic Analysis of Indonesian Image Description", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2018"], ["A Corpus for Reasoning About Natural Language Grounded in Photographs", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "2018"], ["Persuasive Faces: Generating Faces in Advertisements", "", "University of Pittsburgh", "University of Pittsburgh", "University of Pittsburgh, Sutherland Drive, West Oakland, PGH, Allegheny County, Pennsylvania, 15240, USA", "40.44415295", "-79.96243993", "edu", "", "2018"], ["Video Object Segmentation with Re-identification", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "2017"], ["Video captioning with recurrent networks based on frame- and video-level features and visual content classification", "", "Finland", "Finland", "Finland", "61.92411000", "25.74815110", "edu", "", "2015"], ["POL-LWIR Vehicle Detection: Convolutional Neural Networks Meet Polarised Infrared Sensors", "", "Heriot-Watt University", "Heriot-Watt University", "Heriot-Watt University - Edinburgh Campus, Third Gait, Currie, Gogarbank, City of Edinburgh, Scotland, EH14 4AS, UK", "55.91029135", "-3.32345777", "edu", "", "2018"], ["Videos as Space-Time Region Graphs", "", "Robotics Institute", "Robotics Institute", "Institute for Field Robotics, \u0e1b\u0e23\u0e30\u0e0a\u0e32\u0e2d\u0e38\u0e17\u0e34\u0e28, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, \u0e40\u0e02\u0e15\u0e23\u0e32\u0e29\u0e0e\u0e23\u0e4c\u0e1a\u0e39\u0e23\u0e13\u0e30, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, 10140, \u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22", "13.65450525", "100.49423171", "edu", "", "2018"], ["Object Detection via End-to-End Integration of Aspect Ratio and Context Aware Part-based Models and Fully Convolutional Networks", "", "North Carolina State University", "North Carolina State University", "North Carolina State University, Oval Drive, West Raleigh, Raleigh, Wake County, North Carolina, 27695, USA", "35.77184965", "-78.67408695", "edu", "", "2016"], ["Normalized Object Coordinate Space for Category-Level 6D Object Pose and Size Estimation", "", "Princeton University", "Princeton University", "Lot 9, University Place, Princeton Township, Mercer County, New Jersey, 08540, USA", "40.34829285", "-74.66308325", "edu", "", "2019"], ["Face2Text: Collecting an Annotated Image Description Corpus for the Generation of Rich Face Descriptions", "", "University of Copenhagen", "University of Copenhagen", "K\u00f8benhavns Universitet, Krystalgade, K\u00f8dbyen, Vesterbro, K\u00f8benhavn, K\u00f8benhavns Kommune, Region Hovedstaden, 1165, Danmark", "55.68015020", "12.57232700", "edu", "", "2018"], ["Textually Enriched Neural Module Networks for Visual Question Answering", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Slum Segmentation and Change Detection : A Deep Learning Approach", "", "Indian Institute of Science Bangalore", "Indian Institute of Science Bangalore", "IISc, Gulmohar Marg, RMV Stage II - 1st Block, Aramane Nagara Ward, West Zone, Bengaluru, Bangalore Urban, Karnataka, 560012, India", "13.02223470", "77.56718325", "edu", "", "2018"], ["Input Reconstruction Side and top down view Part Segmentation Input Reconstruction Side and top down view Part Segmentation", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2017"], ["Large Scale Fine-Grained Categorization and Domain-Specific Transfer Learning", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "2018"], ["Gather-Excite : Exploiting Feature Context in Convolutional Neural Networks", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2018"], ["Adversarial Removal of Gender from Deep Image Representations", "", "University of Virginia", "University of Virginia", "University of Virginia, Rotunda Alley, Carr's Hill, Albemarle County, Virginia, 22904-4119, USA", "38.03536820", "-78.50353220", "edu", "", "2018"], ["Regularizing Deep Networks by Modeling and Predicting Label Structure", "", "Toyota Technological Institute at Chicago", "Toyota Technological Institute at Chicago", "6045 S Kenwood Ave, Chicago, IL 60637, USA", "41.78469820", "-87.59258480", "edu", "", "2018"], ["Receptive Field Block Net for Accurate and Fast Object Detection", "", "Beihang University", "Beihang University", "\u5317\u4eac\u822a\u7a7a\u822a\u5929\u5927\u5b66, 37, \u5b66\u9662\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100083, \u4e2d\u56fd", "39.98083330", "116.34101249", "edu", "", "2018"], ["SPNet: Superpixel Pyramid Network for Scene Parsing", "Faculty of Information Technology, Beijing University of Technologyy, Beijing, 100124, China", "Beijing University of Technologyy", "Faculty of Information Technology, Beijing University of Technologyy, Beijing, 100124, China", "Chaoyang, China, 100124", "39.87161100", "116.47952900", "edu", "", "2018"], ["Unsupervised Learning of Important Objects from First-Person Videos", "", "University of Pennsylvania", "University of Pennsylvania", "Penn Museum, 3260, South Street, University City, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.94923440", "-75.19198985", "edu", "", "2017"], ["Gather-Excite: Exploiting Feature Context in Convolutional Neural Networks", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2018"], ["Open-vocabulary Phrase Detection", "", "Boston University", "Boston University", "BU, Bay State Road, Fenway, Boston, Suffolk County, Massachusetts, 02215, USA", "42.35042530", "-71.10056114", "edu", "", "2018"], ["SHPD: Surveillance Human Pose Dataset and Performance Evaluation for Coarse-Grained Pose Estimation", "School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China", "Shanghai Jiao Tong University", "Shanghai Jiao Tong University", "\u4e0a\u6d77\u4ea4\u901a\u5927\u5b66\uff08\u5f90\u6c47\u6821\u533a\uff09, \u6dee\u6d77\u897f\u8def, \u756a\u79ba\u5c0f\u533a, \u5e73\u9634\u6865, \u5f90\u6c47\u533a, \u4e0a\u6d77\u5e02, 200052, \u4e2d\u56fd", "31.20081505", "121.42840681", "edu", "", "2018"], ["Weakly Supervised Vehicle Detection in Satellite Images via Multiple Instance Ranking", "Fujian Key Laboratory of Sensing and Computing for Smart City, School of Information Science and Engineering, Xiamen University, 361005, P. R. China", "Xiamen University", "Xiamen University", "\u53a6\u95e8\u5927\u5b66, \u601d\u660e\u5357\u8def Siming South Road, \u601d\u660e\u533a, \u601d\u660e\u533a (Siming), \u53a6\u95e8\u5e02 / Xiamen, \u798f\u5efa\u7701, 361005, \u4e2d\u56fd", "24.43994190", "118.09301781", "edu", "", "2018"], ["Towards Closing the Gap in Weakly Supervised Semantic Segmentation with DCNNs: Combining Local and Global Models.", "", "ETH Z\u00fcrich", "ETH Z\u00fcrich", "ETH Z\u00fcrich, 101, R\u00e4mistrasse, Hochschulen, Altstadt, Z\u00fcrich, Bezirk Z\u00fcrich, Z\u00fcrich, 8092, Schweiz/Suisse/Svizzera/Svizra", "47.37645340", "8.54770931", "edu", "", "2018"], ["Learning to Interpret Satellite Images Using Wikipedia", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2018"], ["On the Relation between Color Image Denoising and Classification", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2017"], ["Pixel-wise object tracking", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "2017"], ["Face Detection Using Improved Faster RCNN", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["CNN+CNN: Convolutional Decoders for Image Captioning", "", "City University of Hong Kong", "City University of Hong Kong", "\u9999\u6e2f\u57ce\u5e02\u5927\u5b78 City University of Hong Kong, \u9054\u5eb7\u8def Tat Hong Avenue, \u5927\u7aa9\u576a Tai Wo Ping, \u6df1\u6c34\u57d7\u5340 Sham Shui Po District, \u4e5d\u9f8d Kowloon, HK, KIL 3348, \u4e2d\u56fd", "22.34000115", "114.16970291", "edu", "", "2018"], ["Neurons Merging Layer: Towards Progressive Redundancy Reduction for Deep Supervised Hashing", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2018"], ["Learning Semantic Segmentation from Synthetic Data: A Geometrically Guided Input-Output Adaptation Approach", "", "ETH Zurich", "Computer Vision Laboratory, ETH Zurich, Zurich, Switzerland", "Sternwartstrasse 7, 8092 Z\u00fcrich, Switzerland", "47.37723980", "8.55216180", "edu", "", "2018"], ["End-to-End Airplane Detection Using Transfer Learning in Remote Sensing Images", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Playing for Benchmarks", "", "TU Darmstadt", "TU Darmstadt", "Karolinenpl. 5, 64289 Darmstadt, Germany", "49.87482770", "8.65632810", "edu", "", "2017"], ["Advances in deep learning approaches for image tagging", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2017"], ["Multimodal Compact Bilinear Pooling for Visual Question Answering and Visual Grounding", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "2016"], ["What Makes for Effective Detection Proposals?", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "2016"], ["A cascaded long short-term memory (LSTM) driven generic visual question answering (VQA)", "Queensland University of Technology", "Queensland University of Technology", "Queensland University of Technology", "Queensland University of Technology, Macgregor Lane, Merthyr, South Brisbane, Brisbane, QLD, 4000, Australia", "-27.47715625", "153.02841004", "edu", "", "2017"], ["Adaptive Object Detection Using Adjacency and Zoom Prediction", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2016"], ["ISIA at the ImageCLEF 2017 Image Caption Task", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2017"], ["Shallow and Deep Convolutional Networks for Saliency Prediction", "", "Dublin City University", "DUBLIN CITY UNIVERSITY", "Dublin City University Glasnevin Campus, Lower Car Park, Wad, Whitehall A ED, Dublin 9, Dublin, County Dublin, Leinster, D09 FW22, Ireland", "53.38522185", "-6.25740874", "edu", "", "2016"], ["Self-Supervised Learning of Visual Features through Embedding Images into Text Topic Spaces", "", "CVIT, KCIS, IIIT Hyderabad, India", "CVIT, KCIS, IIIT Hyderabad, India", "IIIT, Gachibowli, Gachibowli, Hyderabad, Telangana 500032, India", "17.44509810", "78.34976780", "edu", "", "2017"], ["Backdoor Embedding in Convolutional Neural Network Models via Invisible Perturbation", "", "Pennsylvania State University", "Pennsylvania State University", "", "", "", "edu", "", "2018"], ["Pixel Objectness", "", "University of Texas at Austin", "University of Texas at Austin", "University of Texas at Austin, 1, East 23rd Street, The Drag, Austin, Travis County, Texas, 78712, USA", "30.28415100", "-97.73195598", "edu", "", "2017"], ["Semi-automatic video object segmentation by advanced manipulation of segmentation hierarchies", "Disney Research Zurich", "Disney Research Zurich", "Disney Research Zurich", "Stampfenbachstrasse 48, 8006 Z\u00fcrich, Switzerland", "47.38047690", "8.54299640", "company", "", "2015"], ["VADRA: Visual Adversarial Domain Randomization and Augmentation", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Zero-Shot Object Detection", "", "SRI International", "SRI International", "SRI International Building, West 1st Street, Menlo Park, San Mateo County, California, 94025, USA", "37.45857960", "-122.17560525", "edu", "", "2018"], ["Directional Edge Boxes: Exploiting Inner Normal Direction Cues for Effective Object Proposal Generation", "School of Electronic Information and Communications, Huazhong University of Science and Technology, Wuhan, China", "Huazhong University of Science and Technology", "Huazhong University of Science and Technology", "\u534e\u4e2d\u5927, \u73de\u55bb\u8def, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a, \u5173\u4e1c\u8857\u9053, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a\uff08\u6258\u7ba1\uff09, \u6d2a\u5c71\u533a (Hongshan), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430074, \u4e2d\u56fd", "30.50975370", "114.40628810", "edu", "", "2017"], ["Cut, Paste and Learn: Surprisingly Easy Synthesis for Instance Detection", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["On the Effects of Spam Filtering and Incremental Learning for Web-Supervised Visual Concept Classification", "German National Library of Science and Technology & Leibniz Universit\u00e4t Hannover, Hannover, Germany", "German National Library of Science and Technology & Leibniz Universit\u00e4t Hannover, Hannover, Germany", "German National Library of Science and Technology & Leibniz Universit\u00e4t Hannover, Hannover, Germany", "TIB-Standort Technik/Naturwissenschaften, Welfengarten 1B, 30167 Hannover, Germany", "52.38151500", "9.72017100", "edu", "", "2016"], ["Learning Visually-Grounded Semantics from Contrastive Adversarial Samples", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2018"], ["Generation and Comprehension of Unambiguous Object Descriptions", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2016"], ["Visual Question Answering Dataset for Bilingual Image Understanding: A Study of Cross-Lingual Transfer Using Attention Maps", "", "Tokyo Institute of Technology", "Tokyo Institute of Technology", "\u6771\u4eac\u5de5\u696d\u5927\u5b66, \u539a\u6728\u8857\u9053, \u7dd1\u533a, \u753a\u7530\u5e02, \u795e\u5948\u5ddd\u770c, \u95a2\u6771\u5730\u65b9, 226-0026, \u65e5\u672c", "35.51675380", "139.48342251", "edu", "", "2018"], ["Event Specific Multimodal Pattern Mining for Knowledge Base Construction", "Rensselaer Polytechnic Institute, Troy, NY, USA", "Rensselaer Polytechnic Institute", "Rensselaer Polytechnic Institute", "Rensselaer Polytechnic Institute, Sage Avenue, Downtown, City of Troy, Rensselaer County, New York, 12180, USA", "42.72984590", "-73.67950216", "edu", "", "2016"], ["Bachelor Project Image Captioning with Convolutional Neural Networks", "", "Czech Technical University", "Czech Technical University", "\u010cesk\u00e9 vysok\u00e9 u\u010den\u00ed technick\u00e9 v Praze, Resslova, Nov\u00e9 M\u011bsto, Praha, okres Hlavn\u00ed m\u011bsto Praha, Hlavn\u00ed m\u011bsto Praha, Praha, 11121, \u010cesko", "50.07642960", "14.41802312", "edu", "", "2017"], ["Asking for Help with the Right Question by Predicting Human Visual Performance", "", "University of California, Santa Barbara", "University of California, Santa Barbara", "UCSB, Santa Barbara County, California, 93106, USA", "34.41459370", "-119.84581950", "edu", "", "2016"], ["What value high level concepts in vision to language problems ?", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2015"], ["Training Deep Networks with Structured Layers by Matrix Backpropagation", "", "University of Bonn", "University of Bonn", "Rheinische Friedrich-Wilhelms-Universit\u00e4t Bonn, Arkadenhof, Bonn-Zentrum, Stadtbezirk Bonn, Bonn, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 53113, Deutschland", "50.73381240", "7.10224650", "edu", "", "2015"], ["TRAFFIC ANALYSIS USING VISUAL OBJECT DETECTION AND TRACKING", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2017"], ["Fast Neural Architecture Search of Compact Semantic Segmentation Models via Auxiliary Cells.", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2018"], ["Image captioning based on deep reinforcement learning", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["What Action Causes This? Towards Naive Physical Action-Effect Prediction", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2018"], ["Controllable Top-down Feature Transformer", "", "University of California, San Diego", "University of California, San Diego", "UCSD, 9500, Gilman Drive, Sixth College, University City, San Diego, San Diego County, California, 92093, USA", "32.87935255", "-117.23110049", "edu", "", "2017"], ["Natural Language Driven Image Edits using a Semantic Image Manipulation Language (SIMPL)", "", "Virginia Tech", "Virginia Polytechnic Institute and State University", "Virginia Polytechnic Institute and State University, Duck Pond Drive, Blacksburg, Montgomery County, Virginia, 24061-9517, USA", "37.21872455", "-80.42542519", "edu", "", "2018"], ["The Impact of Visual Saliency Prediction in Image Classification", "", "Dublin City University", "DUBLIN CITY UNIVERSITY", "Dublin City University Glasnevin Campus, Lower Car Park, Wad, Whitehall A ED, Dublin 9, Dublin, County Dublin, Leinster, D09 FW22, Ireland", "53.38522185", "-6.25740874", "edu", "", "2017"], ["Oracle Performance for Visual Captioning", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "2016"], ["Linguistic Unit Discovery from Multi-Modal Inputs in Unwritten Languages: Summary of the \u201cSpeaking Rosetta\u201d JSALT 2017 Workshop", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2018"], ["Boosted Attention: Leveraging Human Attention for Image Captioning", "", "University of Minnesota", "University of Minnesota", "WeismanArt, 333, East River Parkway, Marcy-Holmes, Phillips, Minneapolis, Hennepin County, Minnesota, 55455, USA", "44.97308605", "-93.23708813", "edu", "", "2018"], ["Social Image Captioning: Exploring Visual Attention and User Attention", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Road Damage Detection And Classification In Smartphone Captured Images Using Mask R-CNN", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2018"], ["Fast Efficient Object Detection Using Selective Attention", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "2018"], ["ScratchDet: Exploring to Train Single-Shot Object Detectors from Scratch", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2018"], ["Design Pseudo Ground Truth with Motion Cue for Unsupervised Video Object Segmentation.", "", "National Taiwan University", "National Taiwan University", "\u81fa\u5927;\u53f0\u5927, 1, \u7f85\u65af\u798f\u8def\u56db\u6bb5, \u5b78\u5e9c\u91cc, \u5927\u5b89\u5340, \u81fa\u5317\u5e02, 10617, \u81fa\u7063", "25.01682835", "121.53846924", "edu", "", "2018"], ["Partially-Supervised Image Captioning", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "2018"], ["Rank of Experts: Detection Network Ensemble", "", "Electronics and Telecommunications Research Institute, Daejeon, South Korea", "Electronics and Telecommunications Research Institute, Daejeon, South Korea", "Electronics and Telecommunications Research Institute, Sinseong-dong, Daejeon, South Korea", "36.38376500", "127.36694000", "edu", "", "2017"], ["Emergent Translation in Multi-Agent Communication", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "2017"], ["Tag-based video retrieval by embedding semantic content in a continuous word space", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "2016"], ["FastMask: Segment Multi-scale Object Candidates in One Shot", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "2017"], ["Beyond Pixels: A Comprehensive Survey from Bottom-up to Semantic Image Segmentation and Cosegmentation", "", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "2016"], ["Looking at Hands in Autonomous Vehicles: A ConvNet Approach using Part Affinity Fields", "", "University of California, San Diego", "University of California, San Diego", "UCSD, 9500, Gilman Drive, Sixth College, University City, San Diego, San Diego County, California, 92093, USA", "32.87935255", "-117.23110049", "edu", "", "2018"], ["Learning visual attribute from image and text \u2217", "", "Tohoku University", "Tohoku University", "Tohoku University, \u4e94\u6a4b\u901a, \u9752\u8449\u533a, \u4ed9\u53f0\u5e02, \u5bae\u57ce\u770c, \u6771\u5317\u5730\u65b9, 980-0811, \u65e5\u672c", "38.25309450", "140.87365930", "edu", "", "2015"], ["Adopting Abstract Images for Semantic Scene Understanding", "Microsoft Research, One Microsoft Way, Redmond, WA", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2016"], ["Tackling Low Resolution for Better Scene Understanding", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2018"], ["Add English to image Chinese captioning", "PDL, National Laboratory for Parallel and Distributed Processing, NUDT, National University of Defense Technology, Changsha, China", "National University of Defense Technology, China", "National University of Defence Technology, Changsha 410000, China", "\u56fd\u9632\u79d1\u5b66\u6280\u672f\u5927\u5b66, \u4e09\u4e00\u5927\u9053, \u5f00\u798f\u533a, \u5f00\u798f\u533a (Kaifu), \u957f\u6c99\u5e02 / Changsha, \u6e56\u5357\u7701, 410073, \u4e2d\u56fd", "28.22902090", "112.99483204", "edu", "", "2017"], ["Image Captioning with Scene-graph Based Semantic Concepts", "School of ECE, Peking University Shenzhen Graduate School, Shenzhen, China", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Deep Generative Models for Weakly-Supervised Multi-Label Classification", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Visual Question Answering : Datasets , Methods , Challenges and Oppurtunities", "", "Princeton University", "Princeton University", "Lot 9, University Place, Princeton Township, Mercer County, New Jersey, 08540, USA", "40.34829285", "-74.66308325", "edu", "", "2018"], ["Active Grounding of Visual Situations", "", "Santa Fe Institute", "Santa Fe Institute", "Santa Fe Institute, Hyde Park Road, Santa Fe, Santa Fe County, New Mexico, 87501, USA", "35.70028780", "-105.90864847", "edu", "", "2017"], ["ABC-CNN: An Attention Based Convolutional Neural Network for Visual Question Answering", "", "University of Southern California", "University of Southern California", "University of Southern California, Watt Way, Saint James Park, LA, Los Angeles County, California, 90089, USA", "34.02241490", "-118.28634407", "edu", "", "2015"], ["A New Deep Learning-Based Food Recognition System for Dietary Assessment on An Edge Computing Service Infrastructure", "University of Massachusetts, Lowell, MA", "University of Massachusetts", "University of Massachusetts", "University of Massachusetts, Hicks Way, Amherst, Hampshire, Massachusetts, 01003, USA", "42.38897850", "-72.52869870", "edu", "", "2018"], ["Complex event processing for content-based text, image, and video retrieval", "United States Air Force Research Laboratory, Dayton, OH", "United States Air Force Research Laboratory, Dayton, OH", "United States Air Force Research Laboratory, Dayton, OH", "1864 4th St, Wright-Patterson AFB, OH 45433, USA", "39.79084110", "-84.09897580", "edu", "", "2016"], ["Non-parametric Structured Output Networks", "", "Disney Research", "Disney Research", "521 Circle 7 Dr, Glendale, CA 91201, USA", "34.15797420", "-118.28947290", "edu", "", "2017"], ["A Rotation Invariant Latent Factor Model for Moveme Discovery from Static Poses", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "2016"], ["Bidirectional Long-Short Term Memory for Video Description", "", "University of Queensland", "University of Queensland", "University of Queensland, University Drive, Hill End, St Lucia, Brisbane, QLD, 4072, Australia", "-27.49741805", "153.01316956", "edu", "", "2016"], ["Recurrent Topic-Transition GAN for Visual Paragraph Generation", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["Beyond Forward Shortcuts: Fully Convolutional Master-Slave Networks (MSNets) with Backward Skip Connections for Semantic Segmentation", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2017"], ["A Reinforcement Learning Framework for Natural Question Generation using Bi-discriminators", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "2018"], ["VSE++: Improving Visual-Semantic Embeddings with Hard Negatives", "", "University of Toronto", "University of Toronto", "University of Toronto, St. George Street, Bloor Street Culture Corridor, Old Toronto, Toronto, Ontario, M5S 1A5, Canada", "43.66333345", "-79.39769975", "edu", "", "2018"], ["Accelerating Machine Learning Inference with Probabilistic Predicates", "Princeton University &Microsoft, Princeton, NJ, USA", "Microsoft, Redmond, WA, USA", "Microsoft, Redmond, WA, USA", "5000 148th Ave NE, Redmond, WA 98052, USA", "47.65292200", "-122.14223560", "edu", "", "2018"], ["Actor-Critic Sequence Training for Image Captioning", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "2017"], ["Stories in the Eye: Contextual Visual Interactions for Efficient Video to Language Translation", "", "Romania", "Romania", "Romania", "45.94316100", "24.96676000", "edu", "", "2015"], ["Neural Image Captioning for Intelligent Vehicle-to-Passenger Communication", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2017"], ["Hybrid Supervised-unsupervised Image Topic Visualization with Convolutional Neural Network and LDA", "", "Indiana University", "Indiana University", "Indiana University East, West Cart Road, Richmond, Wayne County, Indiana, 47374, USA", "39.86948105", "-84.87956905", "edu", "", "2017"], ["Cross-linguistic differences and similarities in image descriptions", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "2017"], ["Comixify: Transform video into a comics", "", "Warsaw University of Technology", "Warsaw University of Technology", "Politechnika Warszawska, 1, Plac Politechniki, VIII, \u015ar\u00f3dmie\u015bcie, Warszawa, mazowieckie, 00-661, RP", "52.22165395", "21.00735776", "edu", "", "2018"], ["Fine-grained Video Retrieval using Query Phrases \u2014 Waseda_Meisei TRECVID 2017 AVS System \u2014", "Faculty of Science and Engineering, Waseda University, Tokyo, 162-0042, Japan", "Waseda University", "Waseda University", "\u65e9\u7a32\u7530\u5927\u5b66 \u5317\u4e5d\u5dde\u30ad\u30e3\u30f3\u30d1\u30b9, 2-2, \u6709\u6bdb\u5f15\u91ce\u7dda, \u516b\u5e61\u897f\u533a, \u5317\u4e5d\u5dde\u5e02, \u798f\u5ca1\u770c, \u4e5d\u5dde\u5730\u65b9, 808-0135, \u65e5\u672c", "33.88987280", "130.70856205", "edu", "", "2018"], ["DSOD: Learning Deeply Supervised Object Detectors from Scratch", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "2017"], ["Detecting Animals in Infrared Images from Camera-Traps", "Research, MVTec Software GmbH, Munich, Germany", "Technical University of Munich", "Computer Aided Medical Procedures, Technical University of Munich, Garching, Germany", "Boltzmannstra\u00dfe 3, 85748 Garching bei M\u00fcnchen, Germany", "48.26301100", "11.66685700", "edu", "", "2018"], ["PIRC Net : Using Proposal Indexing, Relationships and Context for Phrase Grounding", "", "University of Southern California", "University of Southern California", "University of Southern California, Watt Way, Saint James Park, LA, Los Angeles County, California, 90089, USA", "34.02241490", "-118.28634407", "edu", "", "2018"], ["Learning Unsupervised Visual Grounding Through Semantic Self-Supervision.", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Title Multi-Object Classification and Unsupervised Scene Understanding Using Deep Learning Features and Latent Tree Probabilistic Models Permalink", "", "a", "a", "Independence, KS 67301, USA", "37.09024000", "-95.71289100", "edu", "", "2015"], ["Recurrent Pixel Embedding for Instance Grouping", "", "University of California, Irvine", "University of California, Irvine", "University of California, Irvine, East Peltason Drive, Turtle Rock, Irvine, Orange County, California, 92612, USA", "33.64319010", "-117.84016494", "edu", "", "2018"], ["Distorting Neural Representations to Generate Highly Transferable Adversarial Examples", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "2018"], ["Neural Motifs: Scene Graph Parsing with Global Context", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Artistic Image Generation from Sketch by Using Conditional Adversarial Network and Style Feature Transform", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "2018"], ["C-WSL: Count-Guided Weakly Supervised Localization", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "2018"], ["Non-local RoI for Cross-Object Perception", "", "National Tsing Hua University", "National Tsing Hua University", "\u570b\u7acb\u6e05\u83ef\u5927\u5b78, 101, \u514b\u606d\u6a4b, \u5149\u660e\u91cc, \u8d64\u571f\u5d0e, \u6771\u5340, \u65b0\u7af9\u5e02, 30013, \u81fa\u7063", "24.79254840", "120.99511830", "edu", "", "2018"], ["Learning from Multiview Correlations in Open-Domain Videos", "", "Imperial College London", "Imperial College London", "Imperial College London, Exhibition Road, Brompton, Royal Borough of Kensington and Chelsea, London, Greater London, England, SW7 2AZ, UK", "51.49887085", "-0.17560797", "edu", "", "2018"], ["Exploring the Design Space of Deep Convolutional Neural Networks at Large Scale", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2016"], ["BING++: A Fast High Quality Object Proposal Generator at 100fps", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2015"], ["Actor-Action Semantic Segmentation with Region Masks", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "2018"], ["4D Generic Video Object Proposals", "", "RWTH Aachen University", "RWTH Aachen University", "RWTH Aachen, Mies-van-der-Rohe-Stra\u00dfe, K\u00f6nigsh\u00fcgel, Aachen-Mitte, Aachen, St\u00e4dteregion Aachen, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 52074, Deutschland", "50.77917030", "6.06728733", "edu", "", "2019"], ["Self-Supervised Adversarial Hashing Networks for Cross-Modal Retrieval", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "2018"], ["Active Transfer Learning with Zero-Shot Priors: Reusing Past Datasets for Future Tasks", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "2015"], ["Question Part Relevance and Editing for Cooperative and Context-Aware VQA (C2VQA)", "Universit\u00e0 di Salerno, Dipartimento di Informatica, Fisciano, Italy", "George Mason University", "George Mason University", "George Mason University, Aquia Creek Lane, Country Club View, Blue Oaks, Fairfax County, Virginia, 22030-9998, USA", "38.83133325", "-77.30798839", "edu", "", "2017"], ["Finding Tiny Faces", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["Multiview Cross-supervision for Semantic Segmentation", "", "University of Minnesota", "University of Minnesota", "WeismanArt, 333, East River Parkway, Marcy-Holmes, Phillips, Minneapolis, Hennepin County, Minnesota, 55455, USA", "44.97308605", "-93.23708813", "edu", "", "2018"], ["Asymmetric Deep Supervised Hashing", "", "Nanjing University", "Nanjing University", "NJU, \u4e09\u6c5f\u8def, \u9f13\u697c\u533a, \u5357\u4eac\u5e02, \u6c5f\u82cf\u7701, 210093, \u4e2d\u56fd", "32.05659570", "118.77408833", "edu", "", "2018"], ["Simple Baseline for Visual Question Answering", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "2015"], ["SPICE: Semantic Propositional Image Caption Evaluation", "", "Macquarie University", "Macquarie University, Sydney, Australia", "Balaclava Rd, Macquarie Park NSW 2109, Australia", "-33.77382370", "151.11264980", "edu", "", "2016"], ["Image Captioning with Text-Based Visual Attention", "School of Electronics and Information Engineering, Sun Yat-sen University, Guangzhou, China", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "2018"], ["CBAM: Convolutional Block Attention Module", "", "Korea Advanced Institute of Science and Technology", "Korea Advanced Institute of Science and Technology", "\uce74\uc774\uc2a4\ud2b8, 291, \ub300\ud559\ub85c, \uc628\ucc9c2\ub3d9, \uc628\ucc9c\ub3d9, \uc720\uc131\uad6c, \ub300\uc804, 34141, \ub300\ud55c\ubbfc\uad6d", "36.36971910", "127.36253700", "edu", "", "2018"], ["Panoptic Segmentation with a Joint Semantic and Instance Segmentation Network", "", "TU Eindhoven", "TU Eindhoven", "Technische Universiteit Eindhoven, 2, De Rondom, Villapark, Eindhoven, Noord-Brabant, Nederland, 5600 MB, Nederland", "51.44866020", "5.49039957", "edu", "", "2018"], ["Semantic soft segmentation", "MIT CSAIL and ETH Z\u00fcrich, Switzerland", "MIT CSAIL", "MIT CSAIL", "32 Vassar St, Cambridge, MA 02139, USA", "42.36194070", "-71.09043780", "edu", "", "2018"], ["Identifying implementation bugs in machine learning based image classifiers using metamorphic testing", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2018"], ["The neural network image captioning model based on adversarial training", "", "Russia", "Russia", "Russia", "61.52401000", "105.31875600", "edu", "", "2018"], ["Semantic Segmentation , Urban Navigation , and Research Directions", "", "Princeton University", "Princeton University", "Lot 9, University Place, Princeton Township, Mercer County, New Jersey, 08540, USA", "40.34829285", "-74.66308325", "edu", "", "2018"], ["Implementation of human-robot VQA interaction system with dynamic memory networks", "School of Electrical Engineering, KAIST, Daejeon, Republic of Korea", "KAIST", "KAIST", "291 Daehak-ro, Eoeun-dong, Yuseong-gu, Daejeon, South Korea", "36.37214270", "127.36039000", "edu", "", "2017"], ["Adversarial Cross-Modal Retrieval", "University of Electronic Science and Technology of China, Chengdu, China", "University of Electronic Science and Technology of China", "University of Electronic Science and Technology of China", "Columbus, OH 43210, USA", "40.01419050", "-83.03091430", "edu", "", "2017"], ["Data Analysis Project : Using Knowledge Graphs for Image Classification", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Structure Inference Net: Object Detection Using Scene-Level Context and Instance-Level Relationships", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Statistical Iterative CBCT Reconstruction Based on Neural Network", "Key Laboratory of Image Processing and Intelligent Control of Ministry of Education of China, Huazhong University of Science and Technology, Wuhan, China", "Huazhong University of Science and Technology", "Huazhong University of Science and Technology", "\u534e\u4e2d\u5927, \u73de\u55bb\u8def, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a, \u5173\u4e1c\u8857\u9053, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a\uff08\u6258\u7ba1\uff09, \u6d2a\u5c71\u533a (Hongshan), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430074, \u4e2d\u56fd", "30.50975370", "114.40628810", "edu", "", "2018"], ["Fusion Scheme for Semantic and Instance-level Segmentation", "Computer Science Department, Technical University of Cluj-Napoca, Image Processing and Pattern Recognition Group, Romania", "Technical University of Cluj-Napoca", "Technical University of Cluj-Napoca", "Strada Memorandumului 28, Cluj-Napoca 400114, Romania", "46.76929900", "23.58561300", "edu", "", "2018"], ["Where and Who? Automatic Semantic-Aware Person Composition", "", "University of Virginia", "University of Virginia", "University of Virginia, Rotunda Alley, Carr's Hill, Albemarle County, Virginia, 22904-4119, USA", "38.03536820", "-78.50353220", "edu", "", "2018"], ["Findings of the Second Shared Task on Multimodal Machine Translation and Multilingual Image Description", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "2017"], ["Learning to predict where to look in interactive environments using deep recurrent q-learning", "", "National University of Ireland", "National University of Ireland, Galway", "University Rd, Galway, Ireland", "53.27702430", "-9.06148640", "edu", "", "2016"], ["EmotioNet Challenge: Recognition of facial expressions of emotion in the wild", "", "Ohio State University", "The Ohio State University", "The Ohio State University, Woody Hayes Drive, Columbus, Franklin County, Ohio, 43210, USA", "40.00471095", "-83.02859368", "edu", "", "2017"], ["EMPIRICAL PERFORMANCE UPPER BOUNDS FOR IM- AGE AND VIDEO CAPTIONING", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "2016"], ["Automatic Annotation of Object Instances by Region-Based Recurrent Neural Networks", "Faculty of Electronics, Telecommunications and Information Technology, University Politehnica of Bucharest, Bucharest, 061071, Romania", "University Politehnica of Bucharest", "University Politehnica of Bucharest", "Universitatea Politehnica din Bucure\u0219ti, Novum Invest, Bucure\u0219ti, Militari, Sector 6, Municipiul Bucure\u0219ti, 060042, Rom\u00e2nia", "44.43918115", "26.05044565", "edu", "", "2018"], ["Perceptual Material Attributes Arise in Local Material Recognition", "", "Drexel University", "Drexel University", "Drexel University, Arch Street, Powelton Village, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.95740000", "-75.19026706", "edu", "", "2016"], ["Intelligent Film Assistant for Personalized Video Creation on Mobile Devices", "University of Applied Sciences, Technikum Wien, Vienna, Austria", "University of Applied Sciences", "National Kaohsiung, University of Applied Sciences, Kaohsiung, Taiwan. jspan@cc.kuas.edu.tw", "No. 415\u865f, Jiangong Road, Sanmin District, Kaohsiung City, Taiwan 807", "22.64894580", "120.32831570", "edu", "", "2017"], ["Crowd Counting via Scale-Adaptive Convolutional Neural Network", "", "Shanghai Jiaotong University", "Shanghai Jiaotong University", "China, Shanghai, Minhang, \u4e1c\u5ddd\u8def \u90ae\u653f\u7f16\u7801: 200240", "31.02522010", "121.43377840", "edu", "", "2018"], ["An Improved Convolution Neural Network for Object Detection Using YOLOv2", "Complex System Control Theory and Application Key Laboratory School of Electrical and Electronic Engineering, Tianjin University of Technology (TJUT), Tianjin, 300384, China", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Action Machine: Rethinking Action Recognition in Trimmed Videos", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2018"], ["S4Net: Single Stage Salient-Instance Segmentation", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2017"], ["Answerer in Questioner's Mind for Goal-Oriented Visual Dialogue", "", "Seoul National University", "Seoul National University", "\uc11c\uc6b8\ub300\ud559\uad50, \uc11c\ud638\ub3d9\ub85c, \uc11c\ub454\ub3d9, \uad8c\uc120\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16614, \ub300\ud55c\ubbfc\uad6d", "37.26728000", "126.98411510", "edu", "", "2017"], ["Beyond Manual Annotations for Learning Visual Representations", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2016"], ["Deep Neural Networks for Semantic Segmentation of Multispectral Remote Sensing Imagery", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "2017"], ["Best of Both Worlds: Transferring Knowledge from Discriminative Learning to a Generative Visual Dialog Model", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2017"], ["A vision-grounded dataset for predicting typical locations for verbs", "", "University of California at Berkeley", "International Computer Science Institute, University of California at Berkeley, Berkeley, USA", "1947 Center St, Berkeley, CA 94704, USA", "37.87015430", "-122.27123120", "edu", "", "2018"], ["Leveraging Motion Priors in Videos for Improving Human Segmentation", "", "National Tsing Hua University", "National Tsing Hua University", "\u570b\u7acb\u6e05\u83ef\u5927\u5b78, 101, \u514b\u606d\u6a4b, \u5149\u660e\u91cc, \u8d64\u571f\u5d0e, \u6771\u5340, \u65b0\u7af9\u5e02, 30013, \u81fa\u7063", "24.79254840", "120.99511830", "edu", "", "2018"], ["Gibson Env: Real-World Perception for Embodied Agents", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2018"], ["Explaining the Ambiguity of Object Detection and 6D Pose from Visual Data", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2018"], ["AutoFocus: Efficient Multi-Scale Inference", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "2018"], ["Large-Scale Active Learning with Approximations of Expected Model Output Changes", "", "Friedrich Schiller University Jena", "Computer Vision Group, Friedrich Schiller University Jena, Germany", "Ernst-Abbe-Platz 2, 07743 Jena, Germany", "50.92776710", "11.58217290", "edu", "", "2016"], ["AISHELL-2: Transforming Mandarin ASR Research Into Industrial Scale", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Beyond Grids : Learning Graph Representations for Visual Recognition", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["ALFA: Agglomerative Late Fusion Algorithm for Object Detection", "Institute of Computational Mathematics and Information Technologies, Kazan Federal University, Russia", "Russia", "Russia", "Russia", "61.52401000", "105.31875600", "edu", "", "2018"], ["Question Type Guided Attention in Visual Question Answering", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "2018"], ["Unsupervised Domain Adaptation for Semantic Segmentation with GANs", "", "GE Global Research Center", "GE Global Research Center", "GE Global Research Center, Aqueduct, Niskayuna, Schenectady County, New York, USA", "42.82982480", "-73.87719385", "edu", "", "2017"], ["Unsupervised Ensemble Regression", "", "IBM Thomas J. Watson Research Center", "IBM Thomas J. Watson Research Center", "IBM Yorktown research lab, Adams Road, Millwood, Town of New Castle, Westchester County, New York, 10562, USA", "41.21002475", "-73.80407056", "company", "", "2017"], ["Dockerface: an easy to install and use Faster R-CNN face detector in a Docker container", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2017"], ["Integrating Local Material Recognition with Large-Scale Perceptual Attribute Discovery", "", "Drexel University", "Drexel University", "Drexel University, Arch Street, Powelton Village, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.95740000", "-75.19026706", "edu", "", "2016"], ["Approximate Distribution Matching for Sequence-to-Sequence Learning", "", "University of California", "University of California, San Francisco, San Francisco, USA", "505 Parnassus Ave, San Francisco, CA 94143, USA", "37.76276550", "-122.45775300", "edu", "", "2018"], ["Webly Supervised Learning of Convolutional Networks", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2015"], ["Action-driven 3D indoor scene evolution", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2016"], ["Pedestrian Detection by Feature Selected Self-Similarity Features", "National Key Laboratory of Science and Technology on Communications, University of Electronic Science and Technology of China, Chengdu, China", "University of Electronic Science and Technology of China", "University of Electronic Science and Technology of China", "Columbus, OH 43210, USA", "40.01419050", "-83.03091430", "edu", "", "2018"], ["Multiple Instance Learning Convolutional Neural Networks for object recognition", "", "University of Missouri", "University of Missouri", "L1, Maguire Boulevard, Lemone Industrial Park, Columbia, Boone County, Missouri, 65201, USA", "38.92676100", "-92.29193783", "edu", "", "2016"], ["Amodal Instance Segmentation", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2016"], ["Dictionary-Guided Editing Networks for Paraphrase Generation", "", "Beihang University", "Beihang University", "\u5317\u4eac\u822a\u7a7a\u822a\u5929\u5927\u5b66, 37, \u5b66\u9662\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100083, \u4e2d\u56fd", "39.98083330", "116.34101249", "edu", "", "2018"], ["Ex Paucis Plura : Learning Affordance Segmentation from Very Few Examples", "", "University of Bonn", "University of Bonn", "Rheinische Friedrich-Wilhelms-Universit\u00e4t Bonn, Arkadenhof, Bonn-Zentrum, Stadtbezirk Bonn, Bonn, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 53113, Deutschland", "50.73381240", "7.10224650", "edu", "", "2018"], ["Story Understanding in Video Advertisements", "", "University of Pittsburgh", "University of Pittsburgh", "University of Pittsburgh, Sutherland Drive, West Oakland, PGH, Allegheny County, Pennsylvania, 15240, USA", "40.44415295", "-79.96243993", "edu", "", "2018"], ["Prototype GOD: prototype Generic Objects Dataset for an Object Detection System based on Bird\u2019s \u2013Eye View", "Visual Intelligence Research Group Electronics and Telecommunications Research Institute, Daejeon, Korea", "Visual Intelligence Research Group Electronics and Telecommunications Research Institute, Daejeon, Korea", "Visual Intelligence Research Group Electronics and Telecommunications Research Institute, Daejeon, Korea", "1110-6 Oryong-dong, Buk-gu, Kwangju, South Korea", "35.22537080", "126.84618340", "edu", "", "2018"], ["A Multi-Stream Convolutional Neural Network Framework for Group Activity Recognition", "", "Amirkabir University of Technology", "Amirkabir University of Technology", "\u062f\u0627\u0646\u0634\u06af\u0627\u0647 \u0635\u0646\u0639\u062a\u06cc \u0627\u0645\u06cc\u0631\u06a9\u0628\u06cc\u0631, \u0648\u0644\u06cc \u0639\u0635\u0631, \u0645\u06cc\u062f\u0627\u0646 \u0648\u0644\u06cc\u0639\u0635\u0631, \u0645\u0646\u0637\u0642\u0647 \u06f6 \u0634\u0647\u0631 \u062a\u0647\u0631\u0627\u0646, \u062a\u0647\u0631\u0627\u0646, \u0628\u062e\u0634 \u0645\u0631\u06a9\u0632\u06cc \u0634\u0647\u0631\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0634\u0647\u0631\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0627\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0646\u0628\u0634 \u0628\u0631\u0627\u062f\u0631\u0627\u0646 \u0645\u0638\u0641\u0631, \u200f\u0627\u06cc\u0631\u0627\u0646\u200e", "35.70451400", "51.40972058", "edu", "", "2018"], ["Peephole: Predicting Network Performance Before Training", "", "Chinese University of Hong Kong", "The Chinese University of Hong Kong", "\u4e2d\u5927 CUHK, NA\u68af New Asia Stairs, \u99ac\u6599\u6c34 Ma Liu Shui, \u4e5d\u809a\u6751 Kau To Village, \u6c99\u7530\u5340 Sha Tin District, \u65b0\u754c New Territories, HK, DD193 1191, \u4e2d\u56fd", "22.42031295", "114.20788644", "edu", "", "2017"], ["AutoMarkov DNNs for object classification", "University Politehnica of Bucharest, Faculty of Electronics, Telecommunications and Information Technology, Applied Electronics and Information Engineering Department, 1-3, Iuliu Maniu Ave., Romania 061071", "University Politehnica of Bucharest", "University Politehnica of Bucharest", "Universitatea Politehnica din Bucure\u0219ti, Novum Invest, Bucure\u0219ti, Militari, Sector 6, Municipiul Bucure\u0219ti, 060042, Rom\u00e2nia", "44.43918115", "26.05044565", "edu", "", "2016"], ["Looking deeper and transferring attention for image captioning", "Shanghai Engineering Research Center of Industrial Vision Perception & Intelligent Computing, Shanghai, China", "Shanghai Engineering Research Center of Industrial Vision Perception & Intelligent Computing, Shanghai, China", "Shanghai Engineering Research Center of Industrial Vision Perception & Intelligent Computing, Shanghai, China", "Shanghai, China", "31.23039040", "121.47370210", "edu", "", "2018"], ["Evaluating ResNeXt Model Architecture for Image Classification", "", "University of Waterloo", "University of Waterloo", "University of Waterloo, 200, University Avenue West, Northdale, Beechwood, Waterloo, Regional Municipality of Waterloo, Ontario, N2L 3G1, Canada", "43.47061295", "-80.54724732", "edu", "", "2018"], ["Robot Classification of Human Interruptibility and a Study of Its Effects", "Georgia Institute of Technology, Atlanta, GA", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2018"], ["Fake Sentence Detection as a Training Task for Sentence Encoding", "", "Stony Brook University", "Stony Brook University", "Stony Brook University, 100, Nicolls Road, Stony Brook, Suffolk County, New York, 11794, USA", "40.91531960", "-73.12706260", "edu", "", "2018"], ["Decoupled Novel Object Captioner", "", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "2018"], ["ScratchDet : Training Single-Shot Object Detectors from Scratch", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2018"], ["The Emotional Impact of Audio-Visual Stimuli", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "2018"], ["Question action relevance and editing for visual question answering", "Dipartimento di Informatica, Universit\u00e0 di Salerno, Fisciano, Italy", "George Mason University", "George Mason University", "George Mason University, Aquia Creek Lane, Country Club View, Blue Oaks, Fairfax County, Virginia, 22030-9998, USA", "38.83133325", "-77.30798839", "edu", "", "2018"], ["Cross Modal Distillation for Supervision Transfer", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2016"], ["Hot Anchors: A Heuristic Anchors Sampling Method in RCNN-Based Object Detection", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "2018"], ["HiDDeN: Hiding Data With Deep Networks", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2018"], ["Spatial-Aware Object Embeddings for Zero-Shot Localization and Classification of Actions", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "2017"], ["Subitizing with Variational Autoencoders", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "2018"], ["PoseTrack: Joint Multi-person Pose Estimation and Tracking", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2017"], ["Fast, Diverse and Accurate Image Captioning Guided By Part-of-Speech", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2018"], ["Answer-Type Prediction for Visual Question Answering", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "2016"], ["Semantic Image Segmentation via Deep Parsing Network", "", "Chinese University of Hong Kong", "The Chinese University of Hong Kong", "\u4e2d\u5927 CUHK, NA\u68af New Asia Stairs, \u99ac\u6599\u6c34 Ma Liu Shui, \u4e5d\u809a\u6751 Kau To Village, \u6c99\u7530\u5340 Sha Tin District, \u65b0\u754c New Territories, HK, DD193 1191, \u4e2d\u56fd", "22.42031295", "114.20788644", "edu", "", "2015"], ["Bird Species Classification using Transfer Learning with Multistage Training", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "2018"], ["Traits & Transferability of Adversarial Examples against Instance Segmentation & Object Detection", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2018"], ["Hierarchical Recurrent Neural Encoder for Video Representation with Application to Captioning", "", "University of Technology Sydney", "University of Technology Sydney", "University of Technology Sydney, Omnibus Lane, Ultimo, Sydney, NSW, 2007, Australia", "-33.88096510", "151.20107299", "edu", "", "2016"], ["Self-Contained Stylization via Steganography for Reverse and Serial Style Transfer", "", "National Chiao Tung University", "National Chiao Tung University", "NCTU;\u4ea4\u5927;\u4ea4\u901a\u5927\u5b78;\u4ea4\u5927\u5149\u5fa9\u6821\u5340;\u4ea4\u901a\u5927\u5b78\u5149\u5fa9\u6821\u5340, 1001, \u5927\u5b78\u8def, \u5149\u660e\u91cc, \u8d64\u571f\u5d0e, \u6771\u5340, \u65b0\u7af9\u5e02, 30010, \u81fa\u7063", "24.78676765", "120.99724412", "edu", "", "2018"], ["Improving Fast Segmentation With Teacher-Student Learning", "", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "2018"], ["Describing Natural Images Containing Novel Objects with Knowledge Guided Assitance", "", "Karlsruhe Institute of Technology", "Karlsruhe Institute of Technology", "KIT, Leopoldshafener Allee, Linkenheim, Linkenheim-Hochstetten, Landkreis Karlsruhe, Regierungsbezirk Karlsruhe, Baden-W\u00fcrttemberg, 76351, Deutschland", "49.10184375", "8.43312560", "edu", "", "2017"], ["Do deep features retrieve X ? : A tool for quick inspection of deep visual similarities", "", "University of British Columbia", "University of British Columbia", "University of British Columbia, Eagles Drive, Hawthorn Place, University Endowment Lands, Metro Vancouver, British Columbia, V6T, Canada", "49.25839375", "-123.24658161", "edu", "", "2015"], ["The Middle Child Problem: Revisiting Parametric Min-Cut and Seeds for Object Proposals", "", "Oregon State University", "Oregon State University", "OSU Beaver Store, 538, Southwest 6th Avenue, Portland Downtown, Portland, Multnomah County, Oregon, 97204, USA", "45.51982890", "-122.67797964", "edu", "", "2015"], ["The Unreasonable Effectiveness of Noisy Data for Fine-Grained Recognition", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2016"], ["Traffic-Sign Detection and Classification in the Wild", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2016"], ["Progressively Diffused Networks for Semantic Image Segmentation", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "2017"], ["Interact as You Intend: Intention-Driven Human-Object Interaction Detection", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2018"], ["Segment-Phrase Table for Semantic Segmentation, Visual Entailment and Paraphrasing", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "2015"], ["Loss Functions for Multiset Prediction", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "2018"], ["Fast Online Object Tracking and Segmentation: A Unifying Approach", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2018"], ["Looking for ELMo's friends: Sentence-Level Pretraining Beyond Language Modeling.", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "2018"], ["Transferable Semi-Supervised Semantic Segmentation", "", "Beckman Institute", "Beckman Institute", "Beckman Institute, The Presidents' Walk, Urbana, Champaign County, Illinois, 61801-2341, USA", "40.11571585", "-88.22750772", "edu", "", "2018"], ["Multi-modal Capsule Routing for Actor and Action Video Segmentation Conditioned on Natural Language Queries", "", "University of Central Florida", "University of Central Florida", "University of Central Florida, Libra Drive, University Park, Orange County, Florida, 32816, USA", "28.59899755", "-81.19712501", "edu", "", "2018"], ["Enhancement of SSD by concatenating feature maps for object detection.", "", "Seoul National University", "Seoul National University", "\uc11c\uc6b8\ub300\ud559\uad50, \uc11c\ud638\ub3d9\ub85c, \uc11c\ub454\ub3d9, \uad8c\uc120\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16614, \ub300\ud55c\ubbfc\uad6d", "37.26728000", "126.98411510", "edu", "", "2017"], ["Generation with Recursive Neural Networks", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2016"], ["Active learning and discovery of object categories in the presence of unnameable instances", "Computer Vision Group, Friedrich Schiller University Jena, Germany", "Friedrich Schiller University Jena", "Computer Vision Group, Friedrich Schiller University Jena, Germany", "Ernst-Abbe-Platz 2, 07743 Jena, Germany", "50.92776710", "11.58217290", "edu", "", "2015"], ["Ambiguity Helps: Classification with Disagreements in Crowdsourced Annotations", "", "Harvard University", "Harvard University", "Harvard University, Soldiers Field Road, Allston, Boston, Suffolk County, Massachusetts, 02163, USA", "42.36782045", "-71.12666653", "edu", "", "2016"], ["Spott: On-the-Spot e-Commerce for Television Using Deep Learning-Based Video Analysis Techniques", "Ghent University - imec, ELIS - IDLab, Pietersnieuwstraat, Ghent", "Ghent University - imec", "Ghent University - imec, ELIS - IDLab, Pietersnieuwstraat, Ghent", "Technologiepark-Zwijnaarde 122, 9052 Gent, Belgium", "51.01316270", "3.70941850", "edu", "", "2017"], ["Improving Multi-Person Pose Estimation using Label Correction", "", "Keio University", "Keio University", "\u7db1\u5cf6\u5e02\u6c11\u306e\u68ee, \u3051\u3064\u308f\u308a\u5742, \u6e2f\u5317\u533a, \u6a2a\u6d5c\u5e02, \u795e\u5948\u5ddd\u770c, \u95a2\u6771\u5730\u65b9, 223-0053, \u65e5\u672c", "35.54169690", "139.63471840", "edu", "", "2018"], ["A Focused Dynamic Attention Model for Visual Question Answering", "", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "2016"], ["Solving Visual Madlibs with Multiple Cues", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2016"], ["Unprecedented Usage of Pre-trained CNNs on Beauty Product", "University of Malaya, Kuala Lumpur, Malaysia", "University of Malaya", "University of Malaya", "UM, Lingkaran Wawasan, Bukit Pantai, Bangsar, KL, 50603, Malaysia", "3.12267405", "101.65356103", "edu", "", "2018"], ["Improved Image Captioning via Policy Gradient optimization of SPIDEr", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "2017"], ["High performance and fast object detection in road environments", "DGIST", "DGIST", "DGIST", "South Korea, Daegu, Dalseong-gun, Yuga-myeon, \ud14c\ud06c\ub178\uc911\uc559\ub300\ub85c 333", "35.70528600", "128.45710200", "edu", "", "2017"], ["Object Recognition Based on Amounts of Unlabeled Data", "", "Beijing Institute of Technology", "Beijing Institute of Technology University", "\u5317\u4eac\u7406\u5de5\u5927\u5b66, 5, \u4e2d\u5173\u6751\u5357\u5927\u8857, \u4e2d\u5173\u6751, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100872, \u4e2d\u56fd", "39.95866520", "116.30971281", "edu", "", "2016"], ["Multi-Label Music Genre Classification from Audio, Text and Images Using Deep Features", "", "Universitat Pompeu Fabra", "Universitat Pompeu Fabra", "Dip\u00f2sit de les Aig\u00fces, Carrer de Wellington, la Vila Ol\u00edmpica del Poblenou, Ciutat Vella, Barcelona, BCN, CAT, 08071, Espa\u00f1a", "41.39044285", "2.18891949", "edu", "", "2017"], ["Zero-Shot Detection", "", "Boston University", "Boston University", "BU, Bay State Road, Fenway, Boston, Suffolk County, Massachusetts, 02215, USA", "42.35042530", "-71.10056114", "edu", "", "2018"], ["What are the Visual Features Underlying Human Versus Machine Vision?", "", "Brown University", "Brown University", "Brown University, Waterman Street, College Hill, Providence, Bristol, Rhode Island, 02912, USA", "41.82686820", "-71.40123146", "edu", "", "2017"], ["Material Recognition from Local Appearance in Global Context", "", "Drexel University", "Drexel University", "Drexel University, Arch Street, Powelton Village, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.95740000", "-75.19026706", "edu", "", "2016"], ["Complex Object Classification: A Multi-Modal Multi-Instance Multi-Label Deep Network with Optimal Transport", "Nanjing University, Nanjing, China", "Nanjing University", "Nanjing University", "NJU, \u4e09\u6c5f\u8def, \u9f13\u697c\u533a, \u5357\u4eac\u5e02, \u6c5f\u82cf\u7701, 210093, \u4e2d\u56fd", "32.05659570", "118.77408833", "edu", "", "2018"], ["What's the point: Semantic segmentation with point supervision", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "2016"], ["Extreme Clicking for Efficient Object Annotation", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "2017"], ["Visual Question Answering with Memory-Augmented Networks", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2018"], ["Data Augmentation for Cnn-Based People Detection in Aerial Images", "Department of Information Engineering and Computer Science, Feng Chia University, Taiwan", "Feng Chia University", "Feng Chia University", "\u9022\u7532\u5927\u5b78, 100, \u6587\u83ef\u8def, \u897f\u5e73\u91cc, \u897f\u5c6f\u5340, \u81fa\u4e2d\u5e02, 40724, \u81fa\u7063", "24.18005755", "120.64836072", "edu", "", "2018"], ["Deep correlation for matching images and text", "Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, United Kingdom, GU2 7XH", "University of Surrey", "University of Surrey", "University of Surrey, Spine Road, Guildford Park, Guildford, Surrey, South East, England, GU2 7XH, UK", "51.24303255", "-0.59001382", "edu", "", "2015"], ["Recurrent Models for Situation Recognition", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2017"], ["Deep Attribute-preserving Metric Learning for Natural Language Object Retrieval", "National University of Singapore, Singapore, Singapore", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "2017"], ["Using Syntax to Ground Referring Expressions in Natural Images", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["GANtruth - an unpaired image-to-image translation method for driving scenarios", "", "KTH Royal Institute of Technology, Stockholm", "KTH Royal Institute of Technology, Stockholm", "KTH, Teknikringen, L\u00e4rkstaden, Norra Djurg\u00e5rden, \u00d6stermalms stadsdelsomr\u00e5de, Sthlm, Stockholm, Stockholms l\u00e4n, Svealand, 114 28, Sverige", "59.34986645", "18.07063213", "edu", "", "2018"], ["Revisiting Pre-training: An Efficient Training Method for Image Classification", "", "Beckman Institute", "Beckman Institute", "Beckman Institute, The Presidents' Walk, Urbana, Champaign County, Illinois, 61801-2341, USA", "40.11571585", "-88.22750772", "edu", "", "2018"], ["Evaluation of Segmentation Quality via Adaptive Composition of Reference Segmentations", "School of Engineering, University of California, Merced, CA", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2017"], ["Semantic Segmentation With Object Clique Potentials", "", "Chinese University of Hong Kong", "The Chinese University of Hong Kong", "\u4e2d\u5927 CUHK, NA\u68af New Asia Stairs, \u99ac\u6599\u6c34 Ma Liu Shui, \u4e5d\u809a\u6751 Kau To Village, \u6c99\u7530\u5340 Sha Tin District, \u65b0\u754c New Territories, HK, DD193 1191, \u4e2d\u56fd", "22.42031295", "114.20788644", "edu", "", "2015"], ["Neural Module Networks", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2016"], ["ImagineNet : Style Transfer from Fine Art to Graphical User Interfaces", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "2018"], ["Investigating the feature collection for semantic segmentation via single skip connection", "", "Ajou University", "Ajou University", "\uc544\uc8fc\ub300\ud559\uad50, \uc131\ud638\ub300\uad50, \uc774\uc758\ub3d9, \uc601\ud1b5\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16499, \ub300\ud55c\ubbfc\uad6d", "37.28300030", "127.04548469", "edu", "", "2017"], ["Understanding and Controlling User Linkability in Decentralized Learning", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "2018"], ["PolyMapper: Extracting City Maps using Polygons", "", "ETH Z\u00fcrich", "ETH Z\u00fcrich", "ETH Z\u00fcrich, 101, R\u00e4mistrasse, Hochschulen, Altstadt, Z\u00fcrich, Bezirk Z\u00fcrich, Z\u00fcrich, 8092, Schweiz/Suisse/Svizzera/Svizra", "47.37645340", "8.54770931", "edu", "", "2018"], ["Weakly and Semi Supervised Human Body Part Parsing via Pose-Guided Knowledge Transfer", "", "Shanghai Jiao Tong University", "Shanghai Jiao Tong University", "\u4e0a\u6d77\u4ea4\u901a\u5927\u5b66\uff08\u5f90\u6c47\u6821\u533a\uff09, \u6dee\u6d77\u897f\u8def, \u756a\u79ba\u5c0f\u533a, \u5e73\u9634\u6865, \u5f90\u6c47\u533a, \u4e0a\u6d77\u5e02, 200052, \u4e2d\u56fd", "31.20081505", "121.42840681", "edu", "", "2018"], ["A Fast Multi-Task CNN for Spatial Understanding of Traffic Scenes", "Institute of Control Theory and Systems Engineering, TU Dortmund University, Otto-Hahn-Str. 8, Dortmund, 44227, Germany", "TU Dortmund University", "Institute of Control Theory and Systems Engineering, TU Dortmund University, Otto-Hahn-Str. 8, Dortmund, 44227, Germany", "Emil-Figge-Stra\u00dfe 50, 44227 Dortmund, Germany", "51.49219020", "7.41413620", "edu", "", "2018"], ["Resolving References to Objects in Photographs using the Words-As-Classifiers Model", "", "Bielefeld University", "Bielefeld University", "Fachhochschule Bielefeld FB Gestaltung, 3, Lampingstra\u00dfe, Mitte, Bielefeld, Regierungsbezirk Detmold, Nordrhein-Westfalen, 33615, Deutschland", "52.02804210", "8.51148270", "edu", "", "2016"], ["Image Captioning with Word Level Attention", "Department of Computer Science & Technology, Tongji University, Shanghai, P. R. China", "Tongji University", "Tongji University", "\u540c\u6d4e\u5927\u5b66, 1239, \u56db\u5e73\u8def, \u6c5f\u6e7e, \u8679\u53e3\u533a, \u4e0a\u6d77\u5e02, 200092, \u4e2d\u56fd", "31.28473925", "121.49694909", "edu", "", "2018"], ["Class Rectification Hard Mining for Imbalanced Deep Learning", "", "Queen Mary University of London", "Queen Mary University of London", "Queen Mary (University of London), Mile End Road, Globe Town, Mile End, London Borough of Tower Hamlets, London, Greater London, England, E1 4NS, UK", "51.52472720", "-0.03931035", "edu", "", "2017"], ["Learning deep structured network for weakly supervised change detection", "", "University of Western Australia", "University of Western Australia", "UWA, 35, Underwood Avenue, Daglish, Perth, Western Australia, 6009, Australia", "-31.95040445", "115.79790037", "edu", "", "2017"], ["Towards semantic visual representation: augmenting image representation with natural language descriptors", "Indian Institute of Science, Bangalore, India", "Indian Institute of Science Bangalore", "Indian Institute of Science Bangalore", "IISc, Gulmohar Marg, RMV Stage II - 1st Block, Aramane Nagara Ward, West Zone, Bengaluru, Bangalore Urban, Karnataka, 560012, India", "13.02223470", "77.56718325", "edu", "", "2016"], ["Sequence to Sequence -- Video to Text", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "2015"], ["Efficient Coarse-to-Fine Non-Local Module for the Detection of Small Objects.", "", "Weizmann Institute of Science", "Weizmann Institute of Science", "\u05de\u05db\u05d5\u05df \u05d5\u05d9\u05e6\u05de\u05df \u05dc\u05de\u05d3\u05e2, \u05e9\u05d3\u05e8\u05ea \u05de\u05e8\u05db\u05d5\u05e1 \u05d6\u05d9\u05d5, \u05de\u05e2\u05d5\u05e0\u05d5\u05ea \u05e9\u05d9\u05d9\u05df, \u05d0\u05d7\u05d5\u05d6\u05d5\u05ea \u05d4\u05e0\u05e9\u05d9\u05d0, \u05e8\u05d7\u05d5\u05d1\u05d5\u05ea, \u05de\u05d7\u05d5\u05d6 \u05d4\u05de\u05e8\u05db\u05d6, NO, \u05d9\u05e9\u05e8\u05d0\u05dc", "31.90784990", "34.81334092", "edu", "", "2018"], ["Semantic Instance Annotation of Street Scenes by 3D to 2D Label Transfer", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "2016"], ["RefineNet: Multi-path Refinement Networks for High-Resolution Semantic Segmentation", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "2017"], ["Beyond caption to narrative: Video captioning with multiple sentences", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "2016"], ["Deep patch learning for weakly supervised object classification and discovery", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2017"], ["LDS-Inspired Residual Networks", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2018"], ["Fast Patch-based Style Transfer of Arbitrary Style.", "", "University of British Columbia", "University of British Columbia", "University of British Columbia, Eagles Drive, Hawthorn Place, University Endowment Lands, Metro Vancouver, British Columbia, V6T, Canada", "49.25839375", "-123.24658161", "edu", "", "2016"], ["Mining Object Parts from CNNs via Active Question-Answering", "", "UCLA", "University of California, Los Angeles", "Los Angeles, CA 90095, USA", "34.06892100", "-118.44518110", "edu", "", "2017"], ["A review of object detection based on convolutional neural network", "Fundamental Science on Communication Information Transmission and Fusion Technology Laboratory, Hangzhou 310018, China", "Fundamental Science on Communication Information Transmission and Fusion Technology Laboratory, Hangzhou 310018, China", "Fundamental Science on Communication Information Transmission and Fusion Technology Laboratory, Hangzhou 310018, China", "Jianggan, Hangzhou, Zhejiang, China, 310018", "30.31600970", "120.37394070", "edu", "", "2017"], ["Online Real-Time Multiple Spatiotemporal Action Localisation and Prediction", "", "Oxford University", "Oxford University", "University College, Logic Lane, Grandpont, Oxford, Oxon, South East, England, OX1 4EX, UK", "51.75208490", "-1.25166460", "edu", "", "2017"], ["Procedural Generation of Videos to Train Deep Action Recognition Networks", "", "Toyota Research Institute", "Toyota Research Institute", "Toyota Research Institute, 4440, West El Camino Real, Los Altos, Santa Clara County, California, 94022, USA", "37.40253645", "-122.11655107", "edu", "", "2017"], ["High-Value Target Detection", "", "University of Tartu", "UNIVERSITY OF TARTU", "Paabel, University of Tartu, 17, \u00dclikooli, Kesklinn, Tartu linn, Tartu, Tartu linn, Tartu maakond, 53007, Eesti", "58.38131405", "26.72078081", "edu", "", "2018"], ["Looking Beyond a Clever Narrative: Visual Context and Attention are Primary Drivers of Affect in Video Advertisements", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "2018"], ["Counting Everyday Objects in Everyday Scenes", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "2017"], ["Bottle Detection in the Wild Using Low-Altitude Unmanned Aerial Vehicles", "Wuhan University, School of Electronic Information, Wuhan, 430072, China", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "2018"], ["Deep Learning Based Surveillance System for Open Critical Areas", "", "University of Florence", "University of Florence", "Piazza di San Marco, 4, 50121 Firenze FI, Italy", "43.77764260", "11.25976500", "edu", "", "2018"], ["An efficient license plate recognition system using convolution neural networks", "Department of Electrical Engineering, National Taiwan Normal University, Taipei 106, Taiwan", "National Taiwan Normal University", "National Taiwan Normal University", "\u5e2b\u5927\u5206\u90e8, 88, \u6c40\u5dde\u8def\u56db\u6bb5, \u842c\u5e74\u91cc, \u6587\u5c71\u5340, \u81fa\u5317\u5e02, 11677, \u81fa\u7063", "25.00823205", "121.53577153", "edu", "", "2018"], ["Online Adaptation of Convolutional Neural Networks for Video Object Segmentation", "", "RWTH Aachen University", "RWTH Aachen University", "RWTH Aachen, Mies-van-der-Rohe-Stra\u00dfe, K\u00f6nigsh\u00fcgel, Aachen-Mitte, Aachen, St\u00e4dteregion Aachen, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 52074, Deutschland", "50.77917030", "6.06728733", "edu", "", "2017"], ["Attacking Visual Language Grounding with Adversarial Examples: A Case Study on Neural Image Captioning", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Incremental Segmentation on Private Data without Catastrophic Forgetting", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "2018"], ["Intelligent Computing Methodologies", "Tongji University, Shanghai, China", "Tongji University", "Tongji University", "\u540c\u6d4e\u5927\u5b66, 1239, \u56db\u5e73\u8def, \u6c5f\u6e7e, \u8679\u53e3\u533a, \u4e0a\u6d77\u5e02, 200092, \u4e2d\u56fd", "31.28473925", "121.49694909", "edu", "", "2018"], ["An Intriguing Influence of Visual Data in Learning a Representation", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["Multiview Supervision By Registration", "", "University of Minnesota", "University of Minnesota", "WeismanArt, 333, East River Parkway, Marcy-Holmes, Phillips, Minneapolis, Hennepin County, Minnesota, 55455, USA", "44.97308605", "-93.23708813", "edu", "", "2018"], ["Deep Class-Wise Hashing: Semantics-Preserving Hashing via Class-wise Loss", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2018"], ["Semantic Human Matting", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Multi-evidence Filtering and Fusion for Multi-label Classification, Object Detection and Semantic Segmentation Based on Weakly Supervised Learning", "", "University of Hong Kong", "University of Hong Kong", "\u6d77\u6d0b\u79d1\u5b78\u7814\u7a76\u6240 The Swire Institute of Marine Science, \u9db4\u5480\u9053 Cape D'Aguilar Road, \u9db4\u5480\u4f4e\u96fb\u53f0 Cape D'Aguilar Low-Level Radio Station, \u77f3\u6fb3 Shek O, \u82bd\u83dc\u5751\u6751 Nga Choy Hang Tsuen, \u5357\u5340 Southern District, \u9999\u6e2f\u5cf6 Hong Kong Island, HK, \u4e2d\u56fd", "22.20814690", "114.25964115", "edu", "", "2018"], ["DeepDiary: Automatic Caption Generation for Lifelogging Image Streams.", "", "Indiana University", "Indiana University", "Indiana University East, West Cart Road, Richmond, Wayne County, Indiana, 47374, USA", "39.86948105", "-84.87956905", "edu", "", "2016"], ["Inferring Semantic Layout for Hierarchical Text-to-Image Synthesis", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "2018"], ["Progressive Visual Object Detection with Positive Training Examples Only", "Department of Signal Processing, Tampere University of Technology, Tampere, Finland", "Tampere University of Technology", "Tampere University of Technology", "TTY, 10, Korkeakoulunkatu, Finninm\u00e4ki, Hervanta, Tampere, Tampereen seutukunta, Pirkanmaa, L\u00e4nsi- ja Sis\u00e4-Suomen aluehallintovirasto, L\u00e4nsi-Suomi, Manner-Suomi, 33720, Suomi", "61.44964205", "23.85877462", "edu", "", "2015"], ["Text-to-Image Generation Using Multi-Instance StackGan", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", ""], ["Bundled Object Context for Referring Expressions", "Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS), Institute of Computing Technology, CAS, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "2018"], ["CNN-based rate-distortion modeling for H.265/HEVC", "School of Remote Sensing and Information Engineering, Wuhan University Wuhan, China", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2017"], ["Quantifying the visual concreteness of words and topics in multimodal datasets", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "2018"], ["A task in a suit and a tie: paraphrase generation with semantic augmentation", "", "University of Texas at Austin", "University of Texas at Austin", "University of Texas at Austin, 1, East 23rd Street, The Drag, Austin, Travis County, Texas, 78712, USA", "30.28415100", "-97.73195598", "edu", "", "2018"], ["Towards Automatic Report Generation in Spine Radiology Using Weakly Supervised Framework", "", "China", "China", "China", "35.86166000", "104.19539700", "edu", "", "2018"], ["Pixel Objectness: Learning to Segment Generic Objects Automatically in Images and Videos", "", "Member", "Member", "1322 N Inglewood Ave, Coffeyville, KS 67337, USA", "37.05826350", "-95.67914910", "edu", "", "2018"], ["Show, Adapt and Tell: Adversarial Training of Cross-Domain Image Captioner", "", "Microsoft Research Asia", "Microsoft Live Labs Research, China", "China, Beijing Shi, Haidian Qu, Zhichun Rd, 49\u53f7\u5e0c\u683c\u739b709\u53f7 \u90ae\u653f\u7f16\u7801: 100080", "39.97721700", "116.33763200", "company", "", "2017"], ["Learning Visual Classifiers using Human-centric Annotations", "", "Microsoft", "Microsoft", "7021 S Memorial Dr, Tulsa, OK 74133, USA", "36.06303740", "-95.88099660", "edu", "", "2015"], ["FoveaNet: Perspective-Aware Urban Scene Parsing", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "2017"], ["Exploiting Saliency for Object Segmentation from Image Level Labels", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "2017"], ["A Structured Model For Action Detection", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2018"], ["RepMet: Representative-based metric learning for classification and one-shot object detection", "", "Technion", "Technion", "Haifa, 3200003, Israel", "32.77677830", "35.02312710", "edu", "", "2018"], ["What is the Role of Recurrent Neural Networks (RNNs) in an Image Caption Generator?", "", "University of Malta", "University of Malta", "University of Malta, Ring Road, Japanese Garden, L-Imsida, Malta, MSD 9027, Malta", "35.90232260", "14.48341890", "edu", "", "2017"], ["Batch-normalized recurrent highway networks", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "2017"], ["Weakly Supervised Semantic Segmentation Using Web-Crawled Videos", "", "DGIST", "DGIST", "South Korea, Daegu, Dalseong-gun, Yuga-myeon, \ud14c\ud06c\ub178\uc911\uc559\ub300\ub85c 333", "35.70528600", "128.45710200", "edu", "", "2017"], ["Talking about other people: an endless range of possibilities", "", "University of Copenhagen", "University of Copenhagen", "K\u00f8benhavns Universitet, Krystalgade, K\u00f8dbyen, Vesterbro, K\u00f8benhavn, K\u00f8benhavns Kommune, Region Hovedstaden, 1165, Danmark", "55.68015020", "12.57232700", "edu", "", "2018"], ["What Actions are Needed for Understanding Human Actions in Videos?", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "2017"], ["Kobe University , NICT and University of Siegen at TRECVID 2017 AVS Task", "", "Kobe University", "Kobe University", "\u795e\u6238\u5927\u5b66, \u7058\u4e09\u7530\u7dda, \u7058\u533a, \u795e\u6238\u5e02, \u5175\u5eab\u770c, \u8fd1\u757f\u5730\u65b9, 657-00027, \u65e5\u672c", "34.72757140", "135.23710000", "edu", "", "2018"], ["DeepSign: Deep Learning based Traffic Sign Recognition", "The State Key Laboratory of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "2018"]]}
\ No newline at end of file +{"id": "5e0f8c355a37a5a89351c02f174e7a5ddcb98683", "paper": {"paperId": "5e0f8c355a37a5a89351c02f174e7a5ddcb98683", "key": "coco", "title": "Microsoft COCO: Common Objects in Context", "journal": "Unknown", "address": "", "country": "", "address_type": "", "lat": "", "lng": "", "pdf_link": "https://arxiv.org/pdf/1405.0312.pdf", "report_link": "papers/5e0f8c355a37a5a89351c02f174e7a5ddcb98683.html", "citation_count": 999, "citations_geocoded": 574, "citations_unknown": 425, "citations_empty": 29, "citations_pdf": 799, "citations_doi": 193, "name": "COCO"}, "address": null, "citations": [["Generating Natural Video Descriptions via Multimodal Processing", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2016"], ["Pyramid Scene Parsing Network", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "China", "2017"], ["Analysis of Spatial, Temporal, and Content Characteristics of Videos in the YFCC100M Dataset", "Yonsei University, Incheon, South Korea", "Yonsei University", "Yonsei University", "\uc5f0\uc138\ub300, \uc5f0\uc138\ub85c, \uc2e0\ucd0c\ub3d9, \ucc3d\ucc9c\ub3d9, \uc11c\ub300\ubb38\uad6c, \uc11c\uc6b8\ud2b9\ubcc4\uc2dc, 03789, \ub300\ud55c\ubbfc\uad6d", "37.56004060", "126.93692480", "edu", "", "South Korea", "2016"], ["Context-Aware Captions from Context-Agnostic Supervision", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2017"], ["Understanding Convolution for Semantic Segmentation", "", "TuSimple", "TuSimple", "9191 Towne Centre Dr STE 600, San Diego, CA 92122, USA", "32.87344550", "-117.20656360", "edu", "", "", "2018"], ["GLA: Global\u2013Local Attention for Image Description", "Key Laboratory of Intelligent Information Processing, Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "China", "2018"], ["Generative Attention Model with Adversarial Self-learning for Visual Question Answering", "National University of Singapore, Singapore, Singapore", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "Singapore", "2017"], ["Superpixel Filtering for Mean Field Inference in CRFs Integrated with Convolutional Neural Networks", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2015"], ["Computer Vision and Deep Learning for Automated Surveillance Technology", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2016"], ["Socratic Learning: Augmenting Generative Models to Incorporate Latent Subsets in Training Data", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2016"], ["Multi-Person Pose Estimation for PoseTrack with Enhanced Part Affinity Fields", "", "Beijing, China", "Beijing, China", "Beijing, China", "39.90419990", "116.40739630", "edu", "", "China", "2017"], ["ChestX-Ray8: Hospital-Scale Chest X-Ray Database and Benchmarks on Weakly-Supervised Classification and Localization of Common Thorax Diseases", "", "National Institutes of Health", "National Institutes of Health", "NIH, Pooks Hill, Bethesda, Montgomery County, Maryland, USA", "39.00041165", "-77.10327775", "edu", "", "United States", "2017"], ["Where to put the Image in an Image Caption Generator", "", "University of Malta", "University of Malta", "University of Malta, Ring Road, Japanese Garden, L-Imsida, Malta, MSD 9027, Malta", "35.90232260", "14.48341890", "edu", "", "Malta", "2018"], ["Towards Context-aware Interaction Recognition", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2017"], ["Regional Gating Neural Networks for Multi-label Image Classification", "", "Shanghai, China", "Shanghai, China", "Shanghai, China", "31.23039040", "121.47370210", "edu", "", "", "2016"], ["BDD100K: A Diverse Driving Video Database with Scalable Annotation Tooling", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "China", "2018"], ["The Color of the Cat is Gray: 1 Million Full-Sentences Visual Question Answering (FSVQA).", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "Japan", "2016"], ["Accurate, Large Minibatch SGD: Training ImageNet in 1 Hour.", "", "Facebook", "Facebook", "250 Bryant St, Mountain View, CA 94041, USA", "37.39367170", "-122.08072620", "company", "Facebook, Mountain View, CA", "United States", "2017"], ["SIGNet: Semantic Instance Aided Unsupervised 3D Geometry Perception", "", "UC San Diego", "UC San Diego", "9500 Gilman Dr, La Jolla, CA 92093, USA", "32.88006040", "-117.23401350", "edu", "", "United States", "2018"], ["Action Classification via Concepts and Attributes", "", "Weizmann Institute of Science", "Weizmann Institute of Science", "\u05de\u05db\u05d5\u05df \u05d5\u05d9\u05e6\u05de\u05df \u05dc\u05de\u05d3\u05e2, \u05e9\u05d3\u05e8\u05ea \u05de\u05e8\u05db\u05d5\u05e1 \u05d6\u05d9\u05d5, \u05de\u05e2\u05d5\u05e0\u05d5\u05ea \u05e9\u05d9\u05d9\u05df, \u05d0\u05d7\u05d5\u05d6\u05d5\u05ea \u05d4\u05e0\u05e9\u05d9\u05d0, \u05e8\u05d7\u05d5\u05d1\u05d5\u05ea, \u05de\u05d7\u05d5\u05d6 \u05d4\u05de\u05e8\u05db\u05d6, NO, \u05d9\u05e9\u05e8\u05d0\u05dc", "31.90784990", "34.81334092", "edu", "", "Israel", "2018"], ["Automated Melanoma Recognition in Dermoscopy Images via Very Deep Residual Networks", "Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong", "Chinese University of Hong Kong", "Chinese University of Hong Kong", "Hong Kong, \u99ac\u6599\u6c34\u6c60\u65c1\u8def", "22.41626320", "114.21093180", "edu", "", "China", "2017"], ["Learning to Learn: Model Regression Networks for Easy Small Sample Learning", "", "Robotics Institute", "Robotics Institute", "Institute for Field Robotics, \u0e1b\u0e23\u0e30\u0e0a\u0e32\u0e2d\u0e38\u0e17\u0e34\u0e28, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, \u0e40\u0e02\u0e15\u0e23\u0e32\u0e29\u0e0e\u0e23\u0e4c\u0e1a\u0e39\u0e23\u0e13\u0e30, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, 10140, \u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22", "13.65450525", "100.49423171", "edu", "", "Thailand", "2016"], ["Rethinking Atrous Convolution for Semantic Image Segmentation", "", "Google", "Google, Inc.", "1600 Amphitheatre Pkwy, Mountain View, CA 94043, USA", "37.42199990", "-122.08405750", "company", "Google, Mountain View, CA", "United States", "2017"], ["UMDFaces: An annotated face dataset for training deep networks", "University of Maryland, College Park", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "United States", "2017"], ["Grounding of Textual Phrases in Images by Reconstruction", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "Germany", "2016"], ["Image Captioning with Sentiment Terms via Weakly-Supervised Sentiment Dataset", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "Japan", "2016"], ["iLab-20M: A Large-Scale Controlled Object Dataset to Investigate Deep Learning", "", "Amirkabir University of Technology", "Amirkabir University of Technology", "\u062f\u0627\u0646\u0634\u06af\u0627\u0647 \u0635\u0646\u0639\u062a\u06cc \u0627\u0645\u06cc\u0631\u06a9\u0628\u06cc\u0631, \u0648\u0644\u06cc \u0639\u0635\u0631, \u0645\u06cc\u062f\u0627\u0646 \u0648\u0644\u06cc\u0639\u0635\u0631, \u0645\u0646\u0637\u0642\u0647 \u06f6 \u0634\u0647\u0631 \u062a\u0647\u0631\u0627\u0646, \u062a\u0647\u0631\u0627\u0646, \u0628\u062e\u0634 \u0645\u0631\u06a9\u0632\u06cc \u0634\u0647\u0631\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0634\u0647\u0631\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0627\u0633\u062a\u0627\u0646 \u062a\u0647\u0631\u0627\u0646, \u0646\u0628\u0634 \u0628\u0631\u0627\u062f\u0631\u0627\u0646 \u0645\u0638\u0641\u0631, \u200f\u0627\u06cc\u0631\u0627\u0646\u200e", "35.70451400", "51.40972058", "edu", "", "Iran", "2016"], ["Social Image Tags as a Source of Word Embeddings: A Task-oriented Evaluation", "", "Waseda University", "Waseda University", "\u65e9\u7a32\u7530\u5927\u5b66 \u5317\u4e5d\u5dde\u30ad\u30e3\u30f3\u30d1\u30b9, 2-2, \u6709\u6bdb\u5f15\u91ce\u7dda, \u516b\u5e61\u897f\u533a, \u5317\u4e5d\u5dde\u5e02, \u798f\u5ca1\u770c, \u4e5d\u5dde\u5730\u65b9, 808-0135, \u65e5\u672c", "33.88987280", "130.70856205", "edu", "", "Japan", "2018"], ["Modeling Image Virality with Pairwise Spatial Transformer Networks", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "United States", "2017"], ["Aided Action Recognition Using Single Images", "", "Lehigh University", "Lehigh University", "Lehigh University, Library Drive, Sayre Park, Bethlehem, Northampton County, Pennsylvania, 18015, USA", "40.60680280", "-75.37824880", "edu", "", "United States", "2017"], ["Aligning Text and Document Illustrations: Towards Visually Explainable Digital Humanities", "University of of Modena and Reggio Emilia", "University of of Modena and Reggio Emilia", "University of of Modena and Reggio Emilia", "Via Universit\u00e0, 4, 41121 Modena MO, Italy", "44.64510460", "10.92792680", "edu", "", "Italy", "2018"], ["Weakly- and Semi-supervised Panoptic Segmentation", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2018"], ["Learning Object Detectors from Scratch with Gated Recurrent Feature Pyramids", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "China", "2017"], ["Analysing object detectors from the perspective of co-occurring object categories", "", "Budapest, Hungary", "Budapest, Hungary", "Budapest, Hungary", "47.49791200", "19.04023500", "edu", "", "", "2018"], ["ScaleNet: Guiding Object Proposal Generation in Supermarkets and Beyond", "", "Shanghai University", "Shanghai University", "\u4e0a\u6d77\u5927\u5b66, \u9526\u79cb\u8def, \u5927\u573a\u9547, \u5b9d\u5c71\u533a (Baoshan), \u4e0a\u6d77\u5e02, 201906, \u4e2d\u56fd", "31.32235655", "121.38400941", "edu", "", "China", "2017"], ["Auto-DeepLab: Hierarchical Neural Architecture Search for Semantic Image Segmentation", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2019"], ["Image Caption with Endogenous\u2013Exogenous Attention", "School of Electronic and Information Engineering, Sun Yat-sen University, Guangzhou, China", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "China", "2019"], ["Identity-Aware Textual-Visual Matching with Latent Co-attention", "", "Chinese University of Hong Kong", "Chinese University of Hong Kong", "Hong Kong, \u99ac\u6599\u6c34\u6c60\u65c1\u8def", "22.41626320", "114.21093180", "edu", "", "China", "2017"], ["Multi-label image classification with recurrently learning semantic dependencies", "School of Computer and Information, Hefei University of Technology, Hefei, China", "Hefei University of Technology", "Hefei University of Technology", "\u5408\u80a5\u5de5\u4e1a\u5927\u5b66\uff08\u5c6f\u6eaa\u8def\u6821\u533a\uff09, 193\u53f7, \u5357\u4e00\u73af\u8def, \u822a\u8fd0\u5357\u6751, \u5305\u516c\u8857\u9053, \u5408\u80a5\u5e02\u533a, \u5408\u80a5\u5e02, \u5b89\u5fbd\u7701, 230009, \u4e2d\u56fd", "31.84691800", "117.29053367", "edu", "", "China", "2018"], ["Can You See the (Linguistic) Difference? Exploring Mass/Count Distinction in Vision", "", "University of Padova", "University of Padova", "Via Giovanni Gradenigo, 6, 35131 Padova PD, Italy", "45.40811720", "11.89437860", "edu", "University of Padova, Via Gradenigo, 6 - 35131- Padova, Italy", "Italy", "2017"], ["Dropout during inference as a model for neurological degeneration in an image captioning network", "", "University of Toronto", "University of Toronto", "University of Toronto, St. George Street, Bloor Street Culture Corridor, Old Toronto, Toronto, Ontario, M5S 1A5, Canada", "43.66333345", "-79.39769975", "edu", "", "Canada", "2018"], ["Weakly-Supervised Visual Grounding of Phrases with Linguistic Structures", "", "University of California, Davis", "University of California, Davis", "University of California, Davis, Apiary Drive, Yolo County, California, 95616-5270, USA", "38.53363490", "-121.79077264", "edu", "", "United States", "2017"], ["Deep Multimodal Learning: An Effective Method for Video Classification", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2018"], ["Predicting Motivations of Actions by Leveraging Text", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "United States", "2016"], ["Semantic image segmentation using fully convolutional neural networks with multi-scale images and multi-scale dilated convolutions", "Pattern Recognition and Machine Learning Lab, Gachon University, Seongnam, Korea", "Gachon University", "Gachon University, Gyeonggi-do, South Korea", "1342 Seongnam-daero, Bokjeong-dong, Sujeong-gu, Seongnam-si, Gyeonggi-do, South Korea", "37.45074520", "127.12884740", "edu", "", "South Korea", "2018"], ["Cross-media Multi-level Alignment with Relation Attention Network", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "China", "2018"], ["Non-parametric human segmentation using support vector machine", "Yonsei University, Seoul 03722, South Korea", "Yonsei University", "Yonsei University", "\uc5f0\uc138\ub300, \uc5f0\uc138\ub85c, \uc2e0\ucd0c\ub3d9, \ucc3d\ucc9c\ub3d9, \uc11c\ub300\ubb38\uad6c, \uc11c\uc6b8\ud2b9\ubcc4\uc2dc, 03789, \ub300\ud55c\ubbfc\uad6d", "37.56004060", "126.93692480", "edu", "", "South Korea", "2016"], ["Multispectral Pedestrian Detection via Simultaneous Detection and Segmentation", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "China", "2018"], ["Toward Efficient Simultaneous Detection and Segmentation", "Peking University, National Engineering Laboratory for Video Technology, School of EE&CS, Beijing, China", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "China", "2018"], ["Spatially Adaptive Computation Time for Residual Networks", "", "Google", "Google, Inc.", "1600 Amphitheatre Pkwy, Mountain View, CA 94043, USA", "37.42199990", "-122.08405750", "company", "Google, Mountain View, CA", "United States", "2017"], ["Pre-gen Metrics: Predicting Caption Quality Metrics Without Generating Captions", "University of Malta, Msida, Malta", "University of Malta", "University of Malta", "University of Malta, Ring Road, Japanese Garden, L-Imsida, Malta, MSD 9027, Malta", "35.90232260", "14.48341890", "edu", "", "Malta", "2018"], ["Learning to Evaluate Image Captioning", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "United States", "2018"], ["Style Transfer at 100+ FPS Via Sub-Pixel Super-Resolution", "South China University of Technology", "South China University of Technology", "South China University of Technology", "\u534e\u5357\u7406\u5de5\u5927\u5b66, \u5927\u5b66\u57ce\u4e2d\u73af\u4e1c\u8def, \u5e7f\u5dde\u5927\u5b66\u57ce, \u65b0\u9020, \u756a\u79ba\u533a (Panyu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510006, \u4e2d\u56fd", "23.05020420", "113.39880323", "edu", "", "China", "2018"], ["A Semi-supervised Framework for Image Captioning", "", "ETH Zurich", "ETH Zurich", "R\u00e4mistrasse 101, 8092 Z\u00fcrich, Switzerland", "47.37631300", "8.54766990", "edu", "", "Switzerland", "2016"], ["Language Models for Image Captioning: The Quirks and What Works", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2015"], ["Automatic Dataset Augmentation", "", "Harbin Institute of Technology", "Harbin Institute of Technology", "\u54c8\u5c14\u6ee8\u5de5\u4e1a\u5927\u5b66, \u53f8\u4ee4\u8857, \u5357\u5c97\u533a, \u54c8\u5c14\u6ee8\u5e02 / Harbin, \u9ed1\u9f99\u6c5f\u7701, 150000, \u4e2d\u56fd", "45.74139210", "126.62552755", "edu", "", "China", "2017"], ["The Helping Hand: An Assistive Manipulation Framework Using Augmented Reality and Tongue-Drive Interfaces", "Institute for Robotics and Intelligent Machines, Georgia Institute of Technology, GA, USA", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2018"], ["Consistent Optimization for Single-Shot Object Detection", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2019"], ["Object Proposal Generation With Fully Convolutional Networks", "Keio-National University of Singapore (NUS) Connective Ubiquitous Technology for Embodiments Center, Interactive and Digital Media Institute, NUS, Singapore", "Singapore", "Singapore", "Singapore", "1.35208300", "103.81983600", "edu", "", "Singapore", "2018"], ["ProNet: Learning to Propose Object-Specific Boxes for Cascaded Neural Networks", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2016"], ["Revisiting Graph Construction for Fast Image Segmentation", "", "Xiamen University", "Xiamen University", "\u53a6\u95e8\u5927\u5b66, \u601d\u660e\u5357\u8def Siming South Road, \u601d\u660e\u533a, \u601d\u660e\u533a (Siming), \u53a6\u95e8\u5e02 / Xiamen, \u798f\u5efa\u7701, 361005, \u4e2d\u56fd", "24.43994190", "118.09301781", "edu", "", "China", "2018"], ["Large-Scale Sparse Learning From Noisy Tags for Semantic Segmentation", "Key Laboratory of Machine Perception, School of Electronics Engineering and Computer Science, Peking University, Beijing, China", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "China", "2016"], ["Detection of valuable left-behind items in vehicle cabins", "Visual Information Lab, University of Bristol, UK", "University of Bristol", "University of Bristol", "Victoria Rooms, Whiteladies Road, Cliftonwood, Spike Island, Bristol, City of Bristol, South West England, England, BS8 2PY, UK", "51.45848370", "-2.60977520", "edu", "", "United Kingdom", "2017"], ["Automatic Generation of Grounded Visual Questions", "", "Tianjin University", "Tianjin University", "\u6cf0\u5c71\u822a\u7a7a\u6e2f/\u5929\u6d25\u5927\u53a6, \u67a3\u884c\u8def, \u67a3\u884c \u9ad8\u738b\u5bfa, \u957f\u57ce\u8def, \u5927\u6cb3, \u5cb1\u5cb3\u533a (Daiyue), \u6cf0\u5b89\u5e02, \u5c71\u4e1c\u7701, 271000, \u4e2d\u56fd", "36.20304395", "117.05842113", "edu", "", "China", "2017"], ["Multi-Networks Joint Learning for Large-Scale Cross-Modal Retrieval", "University of Texas at San Antonio, San Antonio, TX, USA", "University of Texas at San Antonio", "University of Texas at San Antonio", "UTSA, Paseo Principal, San Antonio, Bexar County, Texas, 78249-1620, USA", "29.58333105", "-98.61944505", "edu", "", "United States", "2017"], ["Learning to Classify Fine-Grained Categories with Privileged Visual-Semantic Misalignment", "Institute of Automation, CAS Center for Excellence in Brain Science and Intelligence Technology, Chinese Academy of Sciences, Beijing, P.R. China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "China", "2017"], ["Learning a Recurrent Visual Representation for Image Caption Generation", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2014"], ["Intelligent surveillance system for abandoned luggage", "Elektrik - Elektronik M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Orta Do\u011fu Teknik \u00dcniversitesi, Kuzey K\u0131br\u0131s Kamp\u00fcs\u00fc, Kalkanl\u0131, Kuzey K\u0131br\u0131s", "Elektrik - Elektronik M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Orta Do\u011fu Teknik \u00dcniversitesi, Kuzey K\u0131br\u0131s Kamp\u00fcs\u00fc, Kalkanl\u0131, Kuzey K\u0131br\u0131s", "Elektrik - Elektronik M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Orta Do\u011fu Teknik \u00dcniversitesi, Kuzey K\u0131br\u0131s Kamp\u00fcs\u00fc, Kalkanl\u0131, Kuzey K\u0131br\u0131s", "Kalkanl\u0131, G\u00fczelyurt", "35.24908700", "33.02407600", "edu", "", "Turkey", "2018"], ["Exploring Visual Relationship for Image Captioning", "", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "China", "2018"], ["Learning Transferrable Knowledge for Semantic Segmentation with Deep Convolutional Neural Network", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "United States", "2016"], ["Deep affordance learning for single- and multiple-instance object detection", "School of Electrical and Electronic Engineering Nanyang Technological University, Singapore Block S2.1, 50 Nanyang Avenue, Singapore 639798", "Singapore", "Singapore", "Singapore", "1.35208300", "103.81983600", "edu", "", "Singapore", "2017"], ["ESPNet: Efficient Spatial Pyramid of Dilated Convolutions for Semantic Segmentation", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "United States", "2018"], ["A Multi-Layer Approach to Superpixel-based Higher-order Conditional Random Field for Semantic Image Segmentation", "", "University of Texas at Arlington", "University of Texas at Arlington", "University of Texas at Arlington, South Nedderman Drive, Arlington, Tarrant County, Texas, 76010, USA", "32.72836830", "-97.11201835", "edu", "", "United States", "2018"], ["Scene Image Synthesis from Natural Sentences Using Hierarchical Syntactic Analysis", "The University of Tokyo, Tokyo, Japan", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "Japan", "2016"], ["A Mask Regional Convolutional Neural Network Model for Segmenting Real Time Traffic Images", "Department of Electronics and Communication Engineering, Malaviya National Institute of Technology, Jaipur, Rajasthan, 302017, India", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2018"], ["Terahertz Image Detection with the Improved Faster Region-Based Convolutional Neural Network", "", "Xidian University", "Xidian University", "Xidian University (New Campus), 266\u53f7, \u94f6\u674f\u5927\u9053, \u5357\u96f7\u6751, \u957f\u5b89\u533a (Chang'an), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710126, \u4e2d\u56fd", "34.12358250", "108.83546000", "edu", "", "China", "2018"], ["Image Classification using Transfer Learning from Siamese Networks based on Text Metadata Similarity", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2016"], ["BubbleView: an alternative to eye-tracking for crowdsourcing image importance", "", "MIT CSAIL", "MIT CSAIL", "32 Vassar St, Cambridge, MA 02139, USA", "42.36194070", "-71.09043780", "edu", "", "United States", "2017"], ["Benchmarking and Error Diagnosis in Multi-instance Pose Estimation", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "United States", "2017"], ["Meta Networks for Neural Style Transfer", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "China", "2017"], ["Revisiting Unreasonable Effectiveness of Data in Deep Learning Era", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["Semantic Amodal Segmentation", "", "Rutgers University", "Rutgers University", "Rutgers Cook Campus - North, Biel Road, New Brunswick, Middlesex County, New Jersey, 08901, USA", "40.47913175", "-74.43168868", "edu", "", "United States", "2017"], ["Deep Feature Pyramid Reconfiguration for Object Detection", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2018"], ["Person Search via a Mask-Guided Two-Stream CNN Model", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "Australia", "2018"], ["Employing Weak Annotations for Medical Image Analysis Problems", "", "Nagoya University", "Nagoya University", "SuperDARN (Hokkaido West), \u592a\u8f9b\u7b2c1\u652f\u7dda\u6797\u9053, \u9678\u5225\u753a, \u8db3\u5bc4\u90e1, \u5341\u52dd\u7dcf\u5408\u632f\u8208\u5c40, \u5317\u6d77\u9053, \u5317\u6d77\u9053\u5730\u65b9, \u65e5\u672c", "43.53750985", "143.60768225", "edu", "", "Japan", "2017"], ["Watching the TV Watchers", "Georgia Institute of Technology, Center for Behavioral Imaging and School of Electrical and Computer Engineering, Atlanta, GA, USA", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2018"], ["Deep Priority Hashing", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2018"], ["Single-Shot Bidirectional Pyramid Networks for High-Quality Object Detection", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "China", "2018"], ["Neighbourhood Watch: Referring Expression Comprehension via Language-guided Graph Attention Networks", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2018"], ["Text and Object Detection on Billboards", "Faculty of Information Technology, King Mongkut\u2019s Institute of Technology Ladkrabang, Bangkok, 10520, Thailand", "Faculty of Information Technology, King Mongkut\u2019s Institute of Technology Ladkrabang, Bangkok, 10520, Thailand", "Faculty of Information Technology, King Mongkut\u2019s Institute of Technology Ladkrabang, Bangkok, 10520, Thailand", "1 Thanon Chalong Krung, Lat Krabang, Khet Lat Krabang, Krung Thep Maha Nakhon 10520, Thailand", "13.73095530", "100.78117740", "edu", "", "Thailand", "2018"], ["Parallel Attention: A Unified Framework for Visual Object Discovery Through Dialogs and Queries", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2018"], ["Learning Instance-Aware Object Detection Using Determinantal Point Processes", "", "Seoul National University", "Seoul National University", "\uc11c\uc6b8\ub300\ud559\uad50, \uc11c\ud638\ub3d9\ub85c, \uc11c\ub454\ub3d9, \uad8c\uc120\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16614, \ub300\ud55c\ubbfc\uad6d", "37.26728000", "126.98411510", "edu", "", "South Korea", "2018"], ["Maximum Classifier Discrepancy for Unsupervised Domain Adaptation", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "Japan", "2018"], ["Multi-oriented Scene Text Detection via Corner Localization and Region Segmentation", "", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "Singapore", "2018"], ["Mind Your Language: Abuse and Offense Detection for Code-Switched Languages", "", "Singapore", "Singapore", "Singapore", "1.35208300", "103.81983600", "edu", "", "Singapore", "2018"], ["Efficient Video Object Segmentation via Network Modulation", "", "Google", "Google, Inc.", "1600 Amphitheatre Pkwy, Mountain View, CA 94043, USA", "37.42199990", "-122.08405750", "company", "Google, Mountain View, CA", "United States", "2018"], ["Strong-Weak Distribution Alignment for Adaptive Object Detection.", "", "Boston University", "Boston University", "BU, Bay State Road, Fenway, Boston, Suffolk County, Massachusetts, 02215, USA", "42.35042530", "-71.10056114", "edu", "", "United States", "2018"], ["Revisiting Dilated Convolution: A Simple Approach for Weakly- and Semi-Supervised Semantic Segmentation", "", "IBM Thomas J. Watson Research Center", "IBM Thomas J. Watson Research Center", "IBM Yorktown research lab, Adams Road, Millwood, Town of New Castle, Westchester County, New York, 10562, USA", "41.21002475", "-73.80407056", "company", "", "United States", "2018"], ["Detecting Sex From Handwritten Examples", "Fab Lab, Independent University Bangladesh, Dhaka, Bangladesh", "Independent University Bangladesh", "Fab Lab, Independent University Bangladesh, Dhaka, Bangladesh", "Independent University, Bangladesh Plot 16, \u0986\u09ab\u09a4\u09be\u09ac \u0989\u09a6\u09cd\u09a6\u09bf\u09a8 \u0986\u09b9\u09ae\u09c7\u09a6 \u09b0\u09cb\u09a1, \u09a2\u09be\u0995\u09be, Bangladesh", "23.81524690", "90.42796720", "edu", "", "Bangladesh", "2018"], ["Zero-Shot Object Detection: Learning to Simultaneously Recognize and Localize Novel Concepts", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "Australia", "2018"], ["Training CNNs from Synthetic Data for Part Handling in Industrial Environments", "Mercedes-Benz-Cars Daimler AG, Stuttgart, Germany", "Mercedes-Benz-Cars Daimler AG, Stuttgart, Germany", "Mercedes-Benz-Cars Daimler AG, Stuttgart, Germany", "Stuttgarter Str. 90, 70736 Fellbach, Germany", "48.81313800", "9.26374900", "edu", "", "", "2018"], ["Query : \" A man in a red sweatshirt performing breakdance \"", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2018"], ["Semantic segmentation based on iterative contraction and merging", "National Chiao Tung University, Hsinchu, Taiwan", "National Chiao Tung University", "National Chiao Tung University", "NCTU;\u4ea4\u5927;\u4ea4\u901a\u5927\u5b78;\u4ea4\u5927\u5149\u5fa9\u6821\u5340;\u4ea4\u901a\u5927\u5b78\u5149\u5fa9\u6821\u5340, 1001, \u5927\u5b78\u8def, \u5149\u660e\u91cc, \u8d64\u571f\u5d0e, \u6771\u5340, \u65b0\u7af9\u5e02, 30010, \u81fa\u7063", "24.78676765", "120.99724412", "edu", "", "Taiwan", "2017"], ["Image captioning using deep neural architectures", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2017"], ["Training Constrained Deconvolutional Networks for Road Scene Semantic Segmentation", "", "Cambridge University", "Cambridge University", "University, Cambridge Road, Old Portsmouth, Portsmouth, South East, England, PO1 2HB, UK", "50.79440260", "-1.09717480", "edu", "", "United Kingdom", "2016"], ["A sequential guiding network with attention for image captioning", "", "North China Electric Power University", "North China Electric Power University", "\u534e\u5317\u7535\u529b\u5927\u5b66, \u6c38\u534e\u5317\u5927\u8857, \u83b2\u6c60\u533a, \u4fdd\u5b9a\u5e02, \u83b2\u6c60\u533a (Lianchi), \u4fdd\u5b9a\u5e02, \u6cb3\u5317\u7701, 071000, \u4e2d\u56fd", "38.87604460", "115.49738730", "edu", "", "China", "2018"], ["Discriminative Learning of Open-Vocabulary Object Retrieval and Localization by Negative Phrase Augmentation", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "Japan", "2018"], ["A Vision-based Transfer Learning Approach for Recognizing Behavioral Symptoms in People with Dementia", "", "Edge Hill University", "Edge Hill University", "Edge Hill University, St Helens Road, West Lancashire, Lancs, North West England, England, L39 4QP, UK", "53.55821550", "-2.86904651", "edu", "", "United Kingdom", "2018"], ["One-shot Texture Segmentation", "", "University of T\u00fcbingen", "University of T\u00fcbingen", "Geschwister-Scholl-Platz, 72074 T\u00fcbingen, Germany", "48.52947820", "9.04377400", "edu", "", "", "2018"], ["Self-supervised Learning of Motion Capture", "", "University of Pittsburgh", "University of Pittsburgh", "University of Pittsburgh, Sutherland Drive, West Oakland, PGH, Allegheny County, Pennsylvania, 15240, USA", "40.44415295", "-79.96243993", "edu", "", "United States", "2017"], ["Visual Dialog", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2017"], ["Chat-crowd: A Dialog-based Platform for Visual Layout Composition", "", "University of Virginia", "University of Virginia", "University of Virginia, Rotunda Alley, Carr's Hill, Albemarle County, Virginia, 22904-4119, USA", "38.03536820", "-78.50353220", "edu", "", "United States", "2018"], ["VISER: Visual Self-Regularization", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "United States", "2018"], ["BoxSup: Exploiting Bounding Boxes to Supervise Convolutional Networks for Semantic Segmentation", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2015"], ["Visual Referring Expression Recognition: What Do Systems Actually Learn?", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Auto-Encoding Scene Graphs for Image Captioning", "", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "Singapore", "2018"], ["Fast Object Localization Using a CNN Feature Map Based Multi-Scale Search", "", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2016"], ["Dense Image Representation with Spatial Pyramid VLAD Coding of CNN for Locally Robust Captioning", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "Japan", "2016"], ["G-Distillation: Reducing Overconfident Errors on Novel Samples", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2018"], ["Proposal Incorporating Structural Bias into Neural Networks", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["Image Captioning with an Intermediate Attributes Layer", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2015"], ["Weakly Supervised Attention Learning for Textual Phrases Grounding", "", "University of California, Irvine", "University of California, Irvine", "Irvine, CA 92697, USA", "33.64049520", "-117.84429620", "edu", "", "", "2018"], ["Classification of Crash and Near-Crash Events from Dashcam Videos and Telematics", "Verizon Connect Research, via Paisiello 16-20, Florence, 50144, Italy", "Verizon Connect Research, via Paisiello 16-20, Florence, 50144, Italy", "Verizon Connect Research, via Paisiello 16-20, Florence, 50144, Italy", "Via Giovanni Paisiello, 20, 50144 Firenze FI, Italy", "43.78205540", "11.23259400", "edu", "", "Italy", "2018"], ["Identifying Most Walkable Direction for Navigation in an Outdoor Environment", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "United States", "2017"], ["WebVision Database: Visual Learning and Understanding from Web Data", "", "ETH Zurich", "ETH Zurich", "R\u00e4mistrasse 101, 8092 Z\u00fcrich, Switzerland", "47.37631300", "8.54766990", "edu", "", "Switzerland", "2017"], ["Pose Flow: Efficient Online Pose Tracking", "", "Shanghai, China", "Shanghai, China", "Shanghai, China", "31.23039040", "121.47370210", "edu", "", "", "2018"], ["MetaAnchor: Learning to Detect Objects with Customized Anchors", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "China", "2018"], ["Image Description using Deep Neural Networks", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "United States", "2016"], ["Combining Weakly and Webly Supervised Learning for Classifying Food Images", "", "SRI International", "SRI International", "SRI International Building, West 1st Street, Menlo Park, San Mateo County, California, 94025, USA", "37.45857960", "-122.17560525", "edu", "", "United States", "2017"], ["Measuring and Modifying the Intrinsic Memorability of Images", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "United States", "2015"], ["SSP: Supervised Sparse Projections for Large-Scale Retrieval in High Dimensions", "", "University of British Columbia", "University of British Columbia", "University of British Columbia, Eagles Drive, Hawthorn Place, University Endowment Lands, Metro Vancouver, British Columbia, V6T, Canada", "49.25839375", "-123.24658161", "edu", "", "Canada", "2016"], ["Semantic Video Segmentation by Gated Recurrent Flow Propagation", "", "Lund University", "Lund University", "TEM at Lund University, 9, Klostergatan, Stadsk\u00e4rnan, Centrum, Lund, Sk\u00e5ne, G\u00f6taland, 22222, Sverige", "55.70395710", "13.19020110", "edu", "", "Sweden", "2016"], ["Swap Retrieval: Retrieving Images of Cats When the Query Shows a Dog", "KULeuven, Leuven, Belgium", "KULeuven, Leuven, Belgium", "KULeuven, Leuven, Belgium", "Oude Markt 13, 3000 Leuven, Belgium", "50.87795450", "4.70029530", "edu", "", "Spain", "2015"], ["Maya Codical Glyph Segmentation: A Crowdsourcing Approach", "Idiap Research Institute, and the School of Electrical Engineering, Swiss Federal Institute of Technology in Lausanne (EPFL), Martigny, Switzerland", "IDIAP Research Institute", "IDIAP Research Institute", "Idiap Research Institute, Parking Centre du parc, Martigny, Valais/Wallis, 1920, Schweiz/Suisse/Svizzera/Svizra", "46.10923700", "7.08453549", "edu", "", "Switzerland", "2018"], ["Deep Learning for Classification of Colorectal Polyps on Whole-slide Images", "", "Dartmouth College", "Dartmouth College", "Dartmouth College, Tuck Mall, Hanover, Grafton County, New Hampshire, 03755, USA", "43.70479270", "-72.29259090", "edu", "", "United States", "2017"], ["VCI 2 R at the NTCIR-13 Lifelog-2 Lifelog Semantic Access Task", "", "Singapore", "Singapore", "Singapore", "1.35208300", "103.81983600", "edu", "", "Singapore", "2017"], ["Survey on the attention based RNN model and its applications in computer vision", "", "Delft University of Technology", "Delft University of Technology", "TU Delft, Mekelweg, TU-wijk, Delft, Zuid-Holland, Nederland, 2628, Nederland", "51.99882735", "4.37396037", "edu", "", "Netherlands", "2016"], ["Scalable, High-Quality Object Detection", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "United States", "2014"], ["An Integral Pose Regression System for the ECCV2018 PoseTrack Challenge", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "China", "2018"], ["ON GENERIC OBJECT RECOGNITION TECHNIQUES : CHALLENGES AND OPPORTUNITIES Prof", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", ""], ["Joint Flow: Temporal Flow Fields for Multi Person Tracking", "", "University of Bonn", "University of Bonn", "Rheinische Friedrich-Wilhelms-Universit\u00e4t Bonn, Arkadenhof, Bonn-Zentrum, Stadtbezirk Bonn, Bonn, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 53113, Deutschland", "50.73381240", "7.10224650", "edu", "", "Germany", "2018"], ["Snuba: Automating Weak Supervision to Label Training Data", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2018"], ["A 2 A : Attention to Attention Reasoning for Movie Question Answering", "", "Institute of Information Science", "Institute of Information Science", "\u8cc7\u8a0a\u79d1\u5b78\u7814\u7a76\u6240, \u6578\u7406\u5927\u9053, \u4e2d\u7814\u91cc, \u5357\u6e2f\u5b50, \u5357\u6e2f\u5340, \u81fa\u5317\u5e02, 11574, \u81fa\u7063", "25.04107280", "121.61475620", "edu", "", "Taiwan", "2018"], ["Anchor Box Optimization for Object Detection", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2018"], ["Learning Representation for Scene Understanding: Epitomes, CRFs, and CNNs", "", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2015"], ["Taskonomy: Disentangling Task Transfer Learning", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2018"], ["Multi-scale Location-Aware Kernel Representation for Object Detection", "", "Dalian University of Technology", "Dalian University of Technology", "\u5927\u8fde\u7406\u5de5\u5927\u5b66, \u7ea2\u51cc\u8def, \u7518\u4e95\u5b50\u533a, \u51cc\u6c34\u9547, \u7518\u4e95\u5b50\u533a / Ganjingzi, \u5927\u8fde\u5e02 / Dalian, \u8fbd\u5b81\u7701, 116023, \u4e2d\u56fd", "38.88140235", "121.52281098", "edu", "", "China", "2018"], ["Jointly Discovering Visual Objects and Spoken Words from Raw Sensory Input", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "United States", "2018"], ["Who Are Raising Their Hands ? Hand-Raiser Seeking Based on Object Detection and Pose Estimation", "", "Shanghai Jiao Tong University", "Shanghai Jiao Tong University", "\u4e0a\u6d77\u4ea4\u901a\u5927\u5b66\uff08\u5f90\u6c47\u6821\u533a\uff09, \u6dee\u6d77\u897f\u8def, \u756a\u79ba\u5c0f\u533a, \u5e73\u9634\u6865, \u5f90\u6c47\u533a, \u4e0a\u6d77\u5e02, 200052, \u4e2d\u56fd", "31.20081505", "121.42840681", "edu", "", "China", "2018"], ["Robust Adversarial Perturbation on Deep Proposal-based Models", "", "GE Global Research Center", "GE Global Research Center", "GE Global Research Center, Aqueduct, Niskayuna, Schenectady County, New York, USA", "42.82982480", "-73.87719385", "edu", "", "United States", "2018"], ["Cross-Dataset Adaptation for Visual Question Answering", "", "University of Southern California", "University of Southern California", "University of Southern California, Watt Way, Saint James Park, LA, Los Angeles County, California, 90089, USA", "34.02241490", "-118.28634407", "edu", "", "United States", "2018"], ["Grounded Objects and Interactions for Video Captioning", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2017"], ["Priming Neural Networks", "", "York University", "York University", "York University, Keele Campus, Campus Walk, North York, Toronto, Ontario, M3J 2S5, Canada", "43.77439110", "-79.50481085", "edu", "", "Canada", "2018"], ["Neural Baby Talk", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2018"], ["End-to-End Recovery of Human Shape and Pose", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2018"], ["HashNet: Deep Learning to Hash by Continuation", "", "University of Illinois at Chicago", "University of Illinois at Chicago", "University of Illinois at Chicago, West Taylor Street, Greektown, Chicago, Cook County, Illinois, 60607, USA", "41.86898915", "-87.64856256", "edu", "", "United States", "2017"], ["Associative Embedding: End-to-End Learning for Joint Detection and Grouping", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "United States", "2017"], ["Transforming sensor data to the image domain for deep learning \u2014 An application to footstep detection", "", "University of Fribourg", "University of Fribourg", "Avenue de l'Europe 20, 1700 Fribourg, Switzerland", "46.80635700", "7.15200600", "edu", "", "Switzerland", "2017"], ["Towards Deep Cellular Phenotyping in Placental Histology", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2018"], ["People and Vehicles in Danger - A Fire and Flood Detection System in Social Media", "CERTH-ITI, Thessaloniki, Greece", "CERTH-ITI, Thessaloniki, Greece", "CERTH-ITI, Thessaloniki, Greece", "Thermi 570 01, Greece", "40.56676110", "22.99801470", "edu", "", "Greece", "2018"], ["Personalized Serious Games for Cognitive Intervention with Lifelog Visual Analytics", "Singapore Bioimaging Consortium, A*STAR, Singapore, Singapore", "Singapore Bioimaging Consortium, A*STAR, Singapore, Singapore", "Singapore Bioimaging Consortium, A*STAR, Singapore, Singapore", "11 Biopolis Way, Singapore 138667", "1.30452010", "103.79165150", "edu", "", "Singapore", "2018"], ["From UI Design Image to GUI Skeleton: A Neural Machine Translator to Bootstrap Mobile GUI Implementation", "Nanyang Technological University, Singapore", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "Singapore", "2018"], ["Selective Refinement Network for High Performance Face Detection", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["Describing Common Human Visual Actions in Images", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "United States", "2015"], ["Person Retrieval in Surveillance Video using Height, Color and Gender", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2018"], ["A Robot Localization Framework Using CNNs for Object Detection and Pose Estimation", "", "Otto von Guericke University", "Otto von Guericke University", "Otto-von-Guericke-Universit\u00e4t Magdeburg, 2, Universit\u00e4tsplatz, Kr\u00f6kentorviertel/Breiter Weg NA, Alte Neustadt, Magdeburg, Sachsen-Anhalt, 39106, Deutschland", "52.14005065", "11.64471248", "edu", "", "Germany", "2018"], ["Automatic Concept Discovery from Parallel Text and Visual Corpora", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2015"], ["Image Captioning With Visual-Semantic Double Attention", "School of Electronics and Information Technology, Sun Yat-Sen University, Guangdong, People's Republic of China", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "China", "2019"], ["Understanding Fake Faces", "", "Waseda University", "Waseda University", "\u65e9\u7a32\u7530\u5927\u5b66 \u5317\u4e5d\u5dde\u30ad\u30e3\u30f3\u30d1\u30b9, 2-2, \u6709\u6bdb\u5f15\u91ce\u7dda, \u516b\u5e61\u897f\u533a, \u5317\u4e5d\u5dde\u5e02, \u798f\u5ca1\u770c, \u4e5d\u5dde\u5730\u65b9, 808-0135, \u65e5\u672c", "33.88987280", "130.70856205", "edu", "", "Japan", "2018"], ["SketchyScene: Richly-Annotated Scene Sketches", "", "Simon Fraser University", "Simon Fraser University", "SFU Burnaby, South Campus Road, Barnet, Burnaby, Metro Vancouver, British Columbia, V5A 4X6, Canada", "49.27674540", "-122.91777375", "edu", "", "Canada", "2018"], ["Much Ado About Time: Exhaustive Annotation of Temporal Data", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2016"], ["Mainstream: Dynamic Stem-Sharing for Multi-Tenant Video Processing", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["A Multi-Oriented Scene Text Detector with Position-Sensitive Segmentation", "University of Chinese Academy of Sciences, Beijing, China", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["Simple Baselines for Human Pose Estimation and Tracking", "", "University of Electronic Science and Technology of China", "University of Electronic Science and Technology of China", "Columbus, OH 43210, USA", "40.01419050", "-83.03091430", "edu", "", "United States", "2018"], ["Image describing based on bidirectional LSTM and improved sequence sampling", "College of Computer Science. Chongqing University, Chongqing, China", "Chongqing University", "Chongqing University", "\u91cd\u5e86\u5de5\u5546\u5927\u5b66, 19, \u7fe0\u6797\u8def, \u91cd\u5e86\u5e02, \u91cd\u5e86\u5e02\u4e2d\u5fc3, \u5357\u5cb8\u533a (Nan'an), \u91cd\u5e86\u5e02, 400067, \u4e2d\u56fd", "29.50841740", "106.57858552", "edu", "", "China", "2017"], ["Learning from PhotoShop Operation Videos : the PSOV Dataset", "", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2018"], ["Deep conditional neural network for image segmentation", "Department of Computing, The Hong Kong Polytechnic University", "Hong Kong Polytechnic University", "Hong Kong Polytechnic University", "hong kong, 11, \u80b2\u624d\u9053 Yuk Choi Road, \u5c16\u6c99\u5480 Tsim Sha Tsui, \u6cb9\u5c16\u65fa\u5340 Yau Tsim Mong District, \u4e5d\u9f8d Kowloon, HK, 00000, \u4e2d\u56fd", "22.30457200", "114.17976285", "edu", "", "China", "2016"], ["Human Centred Object Co-Segmentation", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2016"], ["Image Captioning with both Object and Scene Information", "Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "China", "2016"], ["SuperNeurons: FFT-based Gradient Sparsification in the Distributed Training of Deep Neural Networks", "", "Brown University", "Brown University", "Brown University, Waterman Street, College Hill, Providence, Bristol, Rhode Island, 02912, USA", "41.82686820", "-71.40123146", "edu", "", "United States", "2018"], ["A Data Driven Approach for Compound Figure Separation Using Convolutional Neural Networks", "", "Indiana University", "Indiana University", "Indiana University East, West Cart Road, Richmond, Wayne County, Indiana, 47374, USA", "39.86948105", "-84.87956905", "edu", "", "United States", "2017"], ["Intention Oriented Image Captions with Guiding Objects", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2018"], ["Aligning Books and Movies: Towards Story-Like Visual Explanations by Watching Movies and Reading Books", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "United States", "2015"], ["Multi-scale Patch Aggregation (MPA) for Simultaneous Detection and Segmentation", "", "Chinese University of Hong Kong", "Chinese University of Hong Kong", "Hong Kong, \u99ac\u6599\u6c34\u6c60\u65c1\u8def", "22.41626320", "114.21093180", "edu", "", "China", "2016"], ["Interpretable Explanations of Black Boxes by Meaningful Perturbation", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2017"], ["A Restricted Visual Turing Test for Deep Scene and Event Understanding", "", "University of California, Los Angeles", "University of California, Los Angeles", "200 UCLA, Medical Plaza Driveway Suite 540, Los Angeles, CA 90095, USA", "34.06877880", "-118.44500940", "edu", "", "United States", "2015"], ["Euphrates: Algorithm-SoC Co-Design for Low-Power Mobile Continuous Vision", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2018"], ["Similarity Reasoning over Semantic Context\u2013graphs", "", "Brown University", "Brown University", "Brown University, Waterman Street, College Hill, Providence, Bristol, Rhode Island, 02912, USA", "41.82686820", "-71.40123146", "edu", "", "United States", "2015"], ["Multimodal Differential Network for Visual Question Generation", "", "Indian Institute of Technology Delhi", "IIIT-Delhi, India", "IIIT-Delhi, Mathura Road, Friends Colony, South East Delhi, Delhi, 110020, India", "28.54632595", "77.27325504", "edu", "", "India", "2018"], ["Learning Spatial Regularization with Image-Level Supervisions for Multi-label Image Classification", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "Australia", "2017"], ["Visual Question Reasoning on General Dependency Tree", "", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "China", "2018"], ["Interactive Demonstration of Probabilistic Predicates", "University of Washington &Microsoft, Seattle, WA, USA", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "United States", "2018"], ["A Dataset and Exploration of Models for Understanding Video Data through Fill-in-the-Blank Question-Answering", "", "Polytechnique Montreal", "Polytechnique Montr\u00b4eal", "2900 Boulevard Edouard-Montpetit, Montr\u00e9al, QC H3T 1J4, Canada", "45.50438400", "-73.61288290", "edu", "Polytechnique Montreal, Montreal, Quebec, Canada", "Canada", "2017"], ["Are You Talking to Me? Reasoned Visual Dialog Generation Through Adversarial Learning", "", "Northwestern Polytechnical University", "Northwestern Polytechnical University", "\u897f\u5317\u5de5\u4e1a\u5927\u5b66 \u53cb\u8c0a\u6821\u533a, 127\u53f7, \u53cb\u8c0a\u897f\u8def, \u957f\u5b89\u8def, \u7891\u6797\u533a (Beilin), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710072, \u4e2d\u56fd", "34.24691520", "108.91061982", "edu", "", "China", "2018"], ["MovieQA: Understanding Stories in Movies through Question-Answering", "", "Karlsruhe Institute of Technology", "Karlsruhe Institute of Technology", "KIT, Leopoldshafener Allee, Linkenheim, Linkenheim-Hochstetten, Landkreis Karlsruhe, Regierungsbezirk Karlsruhe, Baden-W\u00fcrttemberg, 76351, Deutschland", "49.10184375", "8.43312560", "edu", "", "Germany", "2016"], ["ReDMark: Framework for Residual Diffusion Watermarking on Deep Networks", "", "University of Queensland", "University of Queensland", "University of Queensland, University Drive, Hill End, St Lucia, Brisbane, QLD, 4072, Australia", "-27.49741805", "153.01316956", "edu", "", "Australia", "2018"], ["Transitive Invariance for Self-Supervised Visual Representation Learning", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["Using Segmentation to Predict the Absence of Occluded Parts", "", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2015"], ["LabelBank: Revisiting Global Perspectives for Semantic Segmentation", "", "Simon Fraser University", "Simon Fraser University", "SFU Burnaby, South Campus Road, Barnet, Burnaby, Metro Vancouver, British Columbia, V5A 4X6, Canada", "49.27674540", "-122.91777375", "edu", "", "Canada", "2017"], ["Application of a Hybrid Model Based on a Convolutional Auto-Encoder and Convolutional Neural Network in Object-Oriented Remote Sensing Classification", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "China", "2018"], ["Visual Storytelling", "", "Virginia Tech", "Virginia Tech", "Blacksburg, VA 24061, USA", "37.22838430", "-80.42341670", "edu", "", "United States", "2016"], ["Boundary aware image segmentation with unsupervised mixture models", "Image Analysis Group, Technical University Dortmund, Otto-Hahn-Str. 4, 44227 Dortmund, Germany", "Technical University Dortmund", "Image Analysis Group, Technical University Dortmund, Otto-Hahn-Str. 4, 44227 Dortmund, Germany", "Emil-Figge-Stra\u00dfe 50, 44227 Dortmund, Germany", "51.49219020", "7.41413620", "edu", "", "Germany", "2017"], ["Edge-Cloud Collaborative Processing for Intelligent Internet of Things: A Case Study on Smart Surveillance", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2018"], ["Uncovering the Temporal Context for Video Question Answering", "SCS, Carnegie Mellon University, Pittsburgh, USA", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["Inside-Outside Net: Detecting Objects in Context with Skip Pooling and Recurrent Neural Networks", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "United States", "2016"], ["Deep learning-based human head detection and extraction for robotic portrait drawing", "Shenzhen Academy of Robotics, Shenzhen, Guangdong, China", "Shenzhen Academy of Robotics, Shenzhen, Guangdong, China", "Shenzhen Academy of Robotics, Shenzhen, Guangdong, China", "Shenzhen, Guangdong, China", "22.54309600", "114.05786500", "edu", "", "China", "2017"], ["On the Origin of Deep Learning On the Origin of Deep Learning", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["A survey on deep neural network-based image captioning", "School of Mechanical, Electrical and Information Engineering, Shandong University, Weihai, People\u2019s Republic of China", "Shandong University", "Shandong University", "\u5c71\u4e1c\u5927\u5b66, \u6cf0\u5b89\u8857, \u9ccc\u5c71\u536b\u8857\u9053, \u5373\u58a8\u533a, \u9752\u5c9b\u5e02, \u5c71\u4e1c\u7701, 266200, \u4e2d\u56fd", "36.36934730", "120.67381800", "edu", "", "China", "2018"], ["Leveraging Visual Question Answering for Image-Caption Ranking", "", "Virginia Tech", "Virginia Tech", "Blacksburg, VA 24061, USA", "37.22838430", "-80.42341670", "edu", "", "United States", "2016"], ["An object based graph representation for video comparison", "Dept. of Electrical and Computer Engineering, NYU Tandon School of Engineering, New York, USA", "Chongqing University of Technology", "Chongqing University of Technology, China", "69 Hongguang Ave, Banan Qu, Chongqing Shi, China", "29.45832600", "106.52994700", "edu", "", "China", "2017"], ["Phrase Localization and Visual Relationship Detection with Comprehensive Image-Language Cues", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2017"], ["Deep image representations using caption generators", "", "Indian Institute of Science Bangalore", "Indian Institute of Science Bangalore", "IISc, Gulmohar Marg, RMV Stage II - 1st Block, Aramane Nagara Ward, West Zone, Bengaluru, Bangalore Urban, Karnataka, 560012, India", "13.02223470", "77.56718325", "edu", "", "India", "2017"], ["Convolution Neural Networks With Two Pathways for Image Style Recognition", "Institute for Interdisciplinary Information Sciences, Tsinghua University, Beijing, China", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2017"], ["Natural Language Object Retrieval", "", "University of Massachusetts", "University of Massachusetts", "University of Massachusetts, Hicks Way, Amherst, Hampshire, Massachusetts, 01003, USA", "42.38897850", "-72.52869870", "edu", "", "United States", "2016"], ["Watch and learn: Semi-supervised learning of object detectors from videos", "", "Robotics Institute", "Robotics Institute", "Institute for Field Robotics, \u0e1b\u0e23\u0e30\u0e0a\u0e32\u0e2d\u0e38\u0e17\u0e34\u0e28, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, \u0e40\u0e02\u0e15\u0e23\u0e32\u0e29\u0e0e\u0e23\u0e4c\u0e1a\u0e39\u0e23\u0e13\u0e30, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, 10140, \u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22", "13.65450525", "100.49423171", "edu", "", "Thailand", "2015"], ["Advanced Deep-Learning Techniques for Salient and Category-Specific Object Detection: A Survey", "Northwestern Polytechnical University, Xi'an, 710072, China", "Northwestern Polytechnical University", "Northwestern Polytechnical University", "\u897f\u5317\u5de5\u4e1a\u5927\u5b66 \u53cb\u8c0a\u6821\u533a, 127\u53f7, \u53cb\u8c0a\u897f\u8def, \u957f\u5b89\u8def, \u7891\u6797\u533a (Beilin), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710072, \u4e2d\u56fd", "34.24691520", "108.91061982", "edu", "", "China", "2018"], ["Word Prior Detection Segmentation Input \" The left guy \" Image : Query : a guy left the youth Energy", "", "IBM Thomas J. Watson Research Center", "IBM Thomas J. Watson Research Center", "IBM Yorktown research lab, Adams Road, Millwood, Town of New Castle, Westchester County, New York, 10562, USA", "41.21002475", "-73.80407056", "company", "", "United States", "2017"], ["Image Caption with Synchronous Cross-Attention", "Beijing University of Posts and Telecommunications, Beijing, China", "Beijing University of Posts and Telecommunications", "Beijing University of Posts and Telecommunications", "\u5317\u4eac\u90ae\u7535\u5927\u5b66, \u897f\u571f\u57ce\u8def, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100082, \u4e2d\u56fd", "39.96014880", "116.35193921", "edu", "", "China", "2017"], ["Exploring confusing scene classes for the places dataset: Insights and solutions", "Department of Electrical Engineering, University of Southern California, Los Angeles, CA 90089, U.S.A.", "University of Southern California", "University of Southern California", "University of Southern California, Watt Way, Saint James Park, LA, Los Angeles County, California, 90089, USA", "34.02241490", "-118.28634407", "edu", "", "United States", "2017"], ["Adversarial Ranking for Language Generation", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "United States", "2017"], ["3D-SSD: Learning Hierarchical Features from RGB-D Images for Amodal 3D Object Detection", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "China", "2017"], ["Neuron-level Selective Context Aggregation for Scene Segmentation", "", "Shandong University", "Shandong University", "\u5c71\u4e1c\u5927\u5b66, \u6cf0\u5b89\u8857, \u9ccc\u5c71\u536b\u8857\u9053, \u5373\u58a8\u533a, \u9752\u5c9b\u5e02, \u5c71\u4e1c\u7701, 266200, \u4e2d\u56fd", "36.36934730", "120.67381800", "edu", "", "China", "2017"], ["Factors Influencing The Performance of Image Captioning Model: An Evaluation", "SoICT, HUST and School of Information and Communication Technology, Hanoi University of Science and Technology, Hanoi, Vietnam", "Hanoi University of Science and Technology", "Hanoi University of Science and Technology", "HUST, Tr\u1ea7n \u0110\u1ea1i Ngh\u0129a, Hai B\u00e0 Tr\u01b0ng, H\u00e0 N\u1ed9i, 10999, Vietnam", "21.00395200", "105.84360183", "edu", "", "Vietnam", "2016"], ["Accurate License Plate Recognition and Super-Resolution Using a Generative Adversarial Networks on Traffic Surveillance Video", "Gwangju Institute of Science and Technology", "Gwangju Institute of Science and Technology", "Gwangju Institute of Science and Technology", "123 Cheomdangwagi-ro, Oryong-dong, Buk-gu, Kwangju, South Korea", "35.22652880", "126.83998700", "edu", "", "", "2018"], ["Progressive Neural Architecture Search", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2018"], ["Beyond Domain Adaptation: Unseen Domain Encapsulation via Universal Non-volume Preserving Models", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2018"], ["From Known to the Unknown: Transferring Knowledge to Answer Questions about Novel Visual and Semantic Concepts", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "Australia", "2018"], ["Weakly Supervised Salient Object Detection Using Image Labels", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "China", "2018"], ["Reducing Network Agnostophobia", "", "University of Colorado, Colorado Springs", "University of Colorado Colorado Springs", "Main Hall, The Spine, Colorado Springs, El Paso County, Colorado, 80907, USA", "38.89207560", "-104.79716389", "edu", "", "United States", "2018"], ["DistInit: Learning Video Representations without a Single Labeled Video", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2019"], ["Image2song: Song Retrieval via Bridging Image Content and Lyric Words", "", "Northwestern Polytechnical University", "Northwestern Polytechnical University", "\u897f\u5317\u5de5\u4e1a\u5927\u5b66 \u53cb\u8c0a\u6821\u533a, 127\u53f7, \u53cb\u8c0a\u897f\u8def, \u957f\u5b89\u8def, \u7891\u6797\u533a (Beilin), \u897f\u5b89\u5e02, \u9655\u897f\u7701, 710072, \u4e2d\u56fd", "34.24691520", "108.91061982", "edu", "", "China", "2017"], ["Exploring Person Context and Local Scene Context for Object Detection.", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2015"], ["An efficient framework for learning sentence representations", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "United States", "2018"], ["Semantic Correspondence: A Hierarchical Approach", "", "Queensland University of Technology", "Queensland University of Technology", "Queensland University of Technology, Macgregor Lane, Merthyr, South Brisbane, Brisbane, QLD, 4000, Australia", "-27.47715625", "153.02841004", "edu", "", "Australia", "2018"], ["Contextual Memory Trees", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2018"], ["Object Referring in Videos with Language and Human Gaze", "", "ETH Zurich", "ETH Zurich", "R\u00e4mistrasse 101, 8092 Z\u00fcrich, Switzerland", "47.37631300", "8.54766990", "edu", "", "Switzerland", "2018"], ["Adding object detection skills to visual dialogue agents", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "Netherlands", "2018"], ["Generate, Segment and Replace: Towards Generic Manipulation Segmentation.", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "United States", "2018"], ["Grasp2Vec: Learning Object Representations from Self-Supervised Grasping", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2018"], ["Self-view Grounding Given a Narrated 360{\\deg} Video", "", "Microsoft Research Asia", "Microsoft Research Asia", "1 Memorial Dr, Cambridge, MA 02142, USA", "42.36142560", "-71.08120920", "company", "", "United States", "2017"], ["Learning RoI Transformer for Detecting Oriented Objects in Aerial Images", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "China", "2018"], ["Survey of Recent Advances in Visual Question Answering", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2017"], ["Richer Semantic Visual and Language Representation for Video Captioning", "Tongji University, Shanghai, China", "Tongji University", "Tongji University", "\u540c\u6d4e\u5927\u5b66, 1239, \u56db\u5e73\u8def, \u6c5f\u6e7e, \u8679\u53e3\u533a, \u4e0a\u6d77\u5e02, 200092, \u4e2d\u56fd", "31.28473925", "121.49694909", "edu", "", "China", "2017"], ["Touchdown: Natural Language Navigation and Spatial Reasoning in Visual Street Environments", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "United States", "2018"], ["Visual attribute transfer through deep image analogy", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2017"], ["Towards Improved Design and Evaluation of Epileptic Seizure Predictors", "Mayo Systems Electrophysiology Laboratory, Departments of Neurology and Biomedical EngineeringMayo Clinic", "TU Berlin", "TU Berlin", "Franklinstra\u00dfe 28-29, 10587 Berlin, Germany", "52.51806410", "13.32504250", "edu", "Franklinstr. 28/29, 10587, Germany", "Germany", "2018"], ["PReMVOS: Proposal-generation, Refinement and Merging for Video Object Segmentation", "", "RWTH Aachen University", "RWTH Aachen University", "RWTH Aachen, Mies-van-der-Rohe-Stra\u00dfe, K\u00f6nigsh\u00fcgel, Aachen-Mitte, Aachen, St\u00e4dteregion Aachen, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 52074, Deutschland", "50.77917030", "6.06728733", "edu", "", "Germany", "2018"], ["Explicit Bias Discovery in Visual Question Answering Models", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "United States", "2018"], ["AUTOMATIC IMAGE ANNOTATION MODEL USING LSTM APPROACH", "", "Varanasi", "Varanasi", "Varanasi, Uttar Pradesh, India", "25.31764520", "82.97391440", "edu", "", "India", "2017"], ["Mo 2 Cap 2 : Real-time Mo bile 3 D Mo tion Cap ture with a Cap-mounted Fisheye Camera", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2018"], ["Stroke Controllable Fast Style Transfer with Adaptive Receptive Fields", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "Australia", "2018"], ["Learning Visually Grounded Sentence Representations", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2018"], ["Learning 3 D Scene Synthesis from Annotated RGB-D Images", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "China", "2016"], ["Bottom-up Pose Estimation of Multiple Person with Bounding Box Constraint", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "China", "2018"], ["Transferable Interactiveness Prior for Human-Object Interaction Detection", "", "Shanghai Jiao Tong University", "Shanghai Jiao Tong University", "\u4e0a\u6d77\u4ea4\u901a\u5927\u5b66\uff08\u5f90\u6c47\u6821\u533a\uff09, \u6dee\u6d77\u897f\u8def, \u756a\u79ba\u5c0f\u533a, \u5e73\u9634\u6865, \u5f90\u6c47\u533a, \u4e0a\u6d77\u5e02, 200052, \u4e2d\u56fd", "31.20081505", "121.42840681", "edu", "", "China", "2018"], ["A Fully Convolutional Two-Stream Fusion Network for Interactive Image Segmentation", "", "Loughborough University", "Loughborough University", "Computer Science, University Road, Charnwood, Leicestershire, East Midlands, England, LE11 3TP, UK", "52.76635770", "-1.22924610", "edu", "", "United Kingdom", "2019"], ["Corpus Construction and Semantic Analysis of Indonesian Image Description", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2018"], ["A Corpus for Reasoning About Natural Language Grounded in Photographs", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "United States", "2018"], ["Persuasive Faces: Generating Faces in Advertisements", "", "University of Pittsburgh", "University of Pittsburgh", "University of Pittsburgh, Sutherland Drive, West Oakland, PGH, Allegheny County, Pennsylvania, 15240, USA", "40.44415295", "-79.96243993", "edu", "", "United States", "2018"], ["Video Object Segmentation with Re-identification", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "China", "2017"], ["POL-LWIR Vehicle Detection: Convolutional Neural Networks Meet Polarised Infrared Sensors", "", "Heriot-Watt University", "Heriot-Watt University", "Heriot-Watt University - Edinburgh Campus, Third Gait, Currie, Gogarbank, City of Edinburgh, Scotland, EH14 4AS, UK", "55.91029135", "-3.32345777", "edu", "", "United Kingdom", "2018"], ["Videos as Space-Time Region Graphs", "", "Robotics Institute", "Robotics Institute", "Institute for Field Robotics, \u0e1b\u0e23\u0e30\u0e0a\u0e32\u0e2d\u0e38\u0e17\u0e34\u0e28, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, \u0e40\u0e02\u0e15\u0e23\u0e32\u0e29\u0e0e\u0e23\u0e4c\u0e1a\u0e39\u0e23\u0e13\u0e30, \u0e01\u0e23\u0e38\u0e07\u0e40\u0e17\u0e1e\u0e21\u0e2b\u0e32\u0e19\u0e04\u0e23, 10140, \u0e1b\u0e23\u0e30\u0e40\u0e17\u0e28\u0e44\u0e17\u0e22", "13.65450525", "100.49423171", "edu", "", "Thailand", "2018"], ["Object Detection via End-to-End Integration of Aspect Ratio and Context Aware Part-based Models and Fully Convolutional Networks", "", "North Carolina State University", "North Carolina State University", "North Carolina State University, Oval Drive, West Raleigh, Raleigh, Wake County, North Carolina, 27695, USA", "35.77184965", "-78.67408695", "edu", "", "United States", "2016"], ["Normalized Object Coordinate Space for Category-Level 6D Object Pose and Size Estimation", "", "Princeton University", "Princeton University", "Lot 9, University Place, Princeton Township, Mercer County, New Jersey, 08540, USA", "40.34829285", "-74.66308325", "edu", "", "United States", "2019"], ["Face2Text: Collecting an Annotated Image Description Corpus for the Generation of Rich Face Descriptions", "", "University of Copenhagen", "University of Copenhagen", "K\u00f8benhavns Universitet, Krystalgade, K\u00f8dbyen, Vesterbro, K\u00f8benhavn, K\u00f8benhavns Kommune, Region Hovedstaden, 1165, Danmark", "55.68015020", "12.57232700", "edu", "", "Denmark", "2018"], ["Textually Enriched Neural Module Networks for Visual Question Answering", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Slum Segmentation and Change Detection : A Deep Learning Approach", "", "Indian Institute of Science Bangalore", "Indian Institute of Science Bangalore", "IISc, Gulmohar Marg, RMV Stage II - 1st Block, Aramane Nagara Ward, West Zone, Bengaluru, Bangalore Urban, Karnataka, 560012, India", "13.02223470", "77.56718325", "edu", "", "India", "2018"], ["Input Reconstruction Side and top down view Part Segmentation Input Reconstruction Side and top down view Part Segmentation", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2017"], ["Large Scale Fine-Grained Categorization and Domain-Specific Transfer Learning", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "United States", "2018"], ["Gather-Excite : Exploiting Feature Context in Convolutional Neural Networks", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2018"], ["Adversarial Removal of Gender from Deep Image Representations", "", "University of Virginia", "University of Virginia", "University of Virginia, Rotunda Alley, Carr's Hill, Albemarle County, Virginia, 22904-4119, USA", "38.03536820", "-78.50353220", "edu", "", "United States", "2018"], ["Regularizing Deep Networks by Modeling and Predicting Label Structure", "", "Toyota Technological Institute at Chicago", "Toyota Technological Institute at Chicago", "6045 S Kenwood Ave, Chicago, IL 60637, USA", "41.78469820", "-87.59258480", "company", "", "United States", "2018"], ["Probability-based Detection Quality (PDQ): A Probabilistic Approach to Detection Evaluation", "", "Queensland University of Technology (QUT)", "Queensland University of Technology (QUT)", "2 George St, Brisbane City QLD 4000, Australia", "-27.47735700", "153.02841500", "edu", "", "Australia", "2018"], ["Receptive Field Block Net for Accurate and Fast Object Detection", "", "Beihang University", "Beihang University", "\u5317\u4eac\u822a\u7a7a\u822a\u5929\u5927\u5b66, 37, \u5b66\u9662\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100083, \u4e2d\u56fd", "39.98083330", "116.34101249", "edu", "", "China", "2018"], ["SPNet: Superpixel Pyramid Network for Scene Parsing", "Faculty of Information Technology, Beijing University of Technologyy, Beijing, 100124, China", "Beijing University of Technologyy", "Faculty of Information Technology, Beijing University of Technologyy, Beijing, 100124, China", "Chaoyang, China, 100124", "39.87161100", "116.47952900", "edu", "", "China", "2018"], ["Unsupervised Learning of Important Objects from First-Person Videos", "", "University of Pennsylvania", "University of Pennsylvania", "Penn Museum, 3260, South Street, University City, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.94923440", "-75.19198985", "edu", "", "United States", "2017"], ["Gather-Excite: Exploiting Feature Context in Convolutional Neural Networks", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2018"], ["Open-vocabulary Phrase Detection", "", "Boston University", "Boston University", "BU, Bay State Road, Fenway, Boston, Suffolk County, Massachusetts, 02215, USA", "42.35042530", "-71.10056114", "edu", "", "United States", "2018"], ["SHPD: Surveillance Human Pose Dataset and Performance Evaluation for Coarse-Grained Pose Estimation", "School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, 200240, China", "Shanghai Jiao Tong University", "Shanghai Jiao Tong University", "\u4e0a\u6d77\u4ea4\u901a\u5927\u5b66\uff08\u5f90\u6c47\u6821\u533a\uff09, \u6dee\u6d77\u897f\u8def, \u756a\u79ba\u5c0f\u533a, \u5e73\u9634\u6865, \u5f90\u6c47\u533a, \u4e0a\u6d77\u5e02, 200052, \u4e2d\u56fd", "31.20081505", "121.42840681", "edu", "", "China", "2018"], ["Weakly Supervised Vehicle Detection in Satellite Images via Multiple Instance Ranking", "Fujian Key Laboratory of Sensing and Computing for Smart City, School of Information Science and Engineering, Xiamen University, 361005, P. R. China", "Xiamen University", "Xiamen University", "\u53a6\u95e8\u5927\u5b66, \u601d\u660e\u5357\u8def Siming South Road, \u601d\u660e\u533a, \u601d\u660e\u533a (Siming), \u53a6\u95e8\u5e02 / Xiamen, \u798f\u5efa\u7701, 361005, \u4e2d\u56fd", "24.43994190", "118.09301781", "edu", "", "China", "2018"], ["Towards Closing the Gap in Weakly Supervised Semantic Segmentation with DCNNs: Combining Local and Global Models.", "", "ETH Z\u00fcrich", "ETH Z\u00fcrich", "ETH Z\u00fcrich, 101, R\u00e4mistrasse, Hochschulen, Altstadt, Z\u00fcrich, Bezirk Z\u00fcrich, Z\u00fcrich, 8092, Schweiz/Suisse/Svizzera/Svizra", "47.37645340", "8.54770931", "edu", "", "Switzerland", "2018"], ["Learning to Interpret Satellite Images Using Wikipedia", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2018"], ["Pixel-wise object tracking", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "United States", "2017"], ["CNN+CNN: Convolutional Decoders for Image Captioning", "", "City University of Hong Kong", "City University of Hong Kong", "\u9999\u6e2f\u57ce\u5e02\u5927\u5b78 City University of Hong Kong, \u9054\u5eb7\u8def Tat Hong Avenue, \u5927\u7aa9\u576a Tai Wo Ping, \u6df1\u6c34\u57d7\u5340 Sham Shui Po District, \u4e5d\u9f8d Kowloon, HK, KIL 3348, \u4e2d\u56fd", "22.34000115", "114.16970291", "edu", "", "China", "2018"], ["Neurons Merging Layer: Towards Progressive Redundancy Reduction for Deep Supervised Hashing", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["Learning Semantic Segmentation from Synthetic Data: A Geometrically Guided Input-Output Adaptation Approach", "", "ETH Zurich", "ETH Zurich", "R\u00e4mistrasse 101, 8092 Z\u00fcrich, Switzerland", "47.37631300", "8.54766990", "edu", "", "Switzerland", "2018"], ["End-to-End Airplane Detection Using Transfer Learning in Remote Sensing Images", "", "Huazhong University of Science and Technology", "Huazhong University of Science and Technology", "\u534e\u4e2d\u5927, \u73de\u55bb\u8def, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a, \u5173\u4e1c\u8857\u9053, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a\uff08\u6258\u7ba1\uff09, \u6d2a\u5c71\u533a (Hongshan), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430074, \u4e2d\u56fd", "30.50975370", "114.40628810", "edu", "", "China", "2018"], ["Playing for Benchmarks", "", "Intel Labs", "Intel Labs", "4720 Forbes Ave, Pittsburgh, PA 15213, USA", "40.44397890", "-79.94646340", "company", "", "United States", "2017"], ["Advances in deep learning approaches for image tagging", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2017"], ["Multimodal Compact Bilinear Pooling for Visual Question Answering and Visual Grounding", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "Germany", "2016"], ["What Makes for Effective Detection Proposals?", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "Germany", "2016"], ["A cascaded long short-term memory (LSTM) driven generic visual question answering (VQA)", "Queensland University of Technology", "Queensland University of Technology", "Queensland University of Technology", "Queensland University of Technology, Macgregor Lane, Merthyr, South Brisbane, Brisbane, QLD, 4000, Australia", "-27.47715625", "153.02841004", "edu", "", "Australia", "2017"], ["Adaptive Object Detection Using Adjacency and Zoom Prediction", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2016"], ["Shallow and Deep Convolutional Networks for Saliency Prediction", "", "Dublin City University", "DUBLIN CITY UNIVERSITY", "Dublin City University Glasnevin Campus, Lower Car Park, Wad, Whitehall A ED, Dublin 9, Dublin, County Dublin, Leinster, D09 FW22, Ireland", "53.38522185", "-6.25740874", "edu", "", "Ireland", "2016"], ["Self-Supervised Learning of Visual Features through Embedding Images into Text Topic Spaces", "", "CVIT, KCIS, IIIT Hyderabad, India", "CVIT, KCIS, IIIT Hyderabad, India", "IIIT, Gachibowli, Gachibowli, Hyderabad, Telangana 500032, India", "17.44509810", "78.34976780", "edu", "", "India", "2017"], ["Backdoor Embedding in Convolutional Neural Network Models via Invisible Perturbation", "", "Pennsylvania State University", "Pennsylvania State University", "Old Main, State College, PA 16801, USA", "40.79821330", "-77.85990840", "edu", "", "United States", "2018"], ["Pixel Objectness", "", "University of Texas at Austin", "University of Texas at Austin", "University of Texas at Austin, 1, East 23rd Street, The Drag, Austin, Travis County, Texas, 78712, USA", "30.28415100", "-97.73195598", "edu", "", "United States", "2017"], ["Semi-automatic video object segmentation by advanced manipulation of segmentation hierarchies", "Disney Research Zurich", "Disney Research Zurich", "Disney Research Zurich", "Stampfenbachstrasse 48, 8006 Z\u00fcrich, Switzerland", "47.38047690", "8.54299640", "company", "", "Switzerland", "2015"], ["VADRA: Visual Adversarial Domain Randomization and Augmentation", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Zero-Shot Object Detection", "", "NEC Labs America", "NEC Labs America", "4 Independence Way #200, Princeton, NJ 08540, USA", "40.35981820", "-74.59502250", "company", "", "United States", "2018"], ["Automatic Semantic Content Removal by Learning to Neglect.", "", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2018"], ["Directional Edge Boxes: Exploiting Inner Normal Direction Cues for Effective Object Proposal Generation", "School of Electronic Information and Communications, Huazhong University of Science and Technology, Wuhan, China", "Huazhong University of Science and Technology", "Huazhong University of Science and Technology", "\u534e\u4e2d\u5927, \u73de\u55bb\u8def, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a, \u5173\u4e1c\u8857\u9053, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a\uff08\u6258\u7ba1\uff09, \u6d2a\u5c71\u533a (Hongshan), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430074, \u4e2d\u56fd", "30.50975370", "114.40628810", "edu", "", "China", "2017"], ["Cut, Paste and Learn: Surprisingly Easy Synthesis for Instance Detection", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["On the Effects of Spam Filtering and Incremental Learning for Web-Supervised Visual Concept Classification", "German National Library of Science and Technology & Leibniz Universit\u00e4t Hannover, Hannover, Germany", "Leibniz Universit\u00e4t Hannover, Hannover, Germany", "Leibniz Universit\u00e4t Hannover, Hannover, Germany", "Welfengarten 1, 30167 Hannover, Germany", "52.38296410", "9.71969890", "edu", "", "Germany", "2016"], ["Learning Visually-Grounded Semantics from Contrastive Adversarial Samples", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2018"], ["Generation and Comprehension of Unambiguous Object Descriptions", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2016"], ["Visual Question Answering Dataset for Bilingual Image Understanding: A Study of Cross-Lingual Transfer Using Attention Maps", "", "Tokyo Institute of Technology", "Tokyo Institute of Technology", "\u6771\u4eac\u5de5\u696d\u5927\u5b66, \u539a\u6728\u8857\u9053, \u7dd1\u533a, \u753a\u7530\u5e02, \u795e\u5948\u5ddd\u770c, \u95a2\u6771\u5730\u65b9, 226-0026, \u65e5\u672c", "35.51675380", "139.48342251", "edu", "", "Japan", "2018"], ["Event Specific Multimodal Pattern Mining for Knowledge Base Construction", "Rensselaer Polytechnic Institute, Troy, NY, USA", "Rensselaer Polytechnic Institute", "Rensselaer Polytechnic Institute", "Rensselaer Polytechnic Institute, Sage Avenue, Downtown, City of Troy, Rensselaer County, New York, 12180, USA", "42.72984590", "-73.67950216", "edu", "", "United States", "2016"], ["Bachelor Project Image Captioning with Convolutional Neural Networks", "", "Czech Technical University", "Czech Technical University", "\u010cesk\u00e9 vysok\u00e9 u\u010den\u00ed technick\u00e9 v Praze, Resslova, Nov\u00e9 M\u011bsto, Praha, okres Hlavn\u00ed m\u011bsto Praha, Hlavn\u00ed m\u011bsto Praha, Praha, 11121, \u010cesko", "50.07642960", "14.41802312", "edu", "", "Czech Republic", "2017"], ["Asking for Help with the Right Question by Predicting Human Visual Performance", "", "University of California, Santa Barbara", "University of California, Santa Barbara", "UCSB, Santa Barbara County, California, 93106, USA", "34.41459370", "-119.84581950", "edu", "", "United States", "2016"], ["What value high level concepts in vision to language problems ?", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2015"], ["Training Deep Networks with Structured Layers by Matrix Backpropagation", "", "University of Bonn", "University of Bonn", "Rheinische Friedrich-Wilhelms-Universit\u00e4t Bonn, Arkadenhof, Bonn-Zentrum, Stadtbezirk Bonn, Bonn, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 53113, Deutschland", "50.73381240", "7.10224650", "edu", "", "Germany", "2015"], ["TRAFFIC ANALYSIS USING VISUAL OBJECT DETECTION AND TRACKING", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2017"], ["Fast Neural Architecture Search of Compact Semantic Segmentation Models via Auxiliary Cells.", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2018"], ["Image captioning based on deep reinforcement learning", "", "Beijing, China", "Beijing, China", "Beijing, China", "39.90419990", "116.40739630", "edu", "", "China", "2018"], ["What Action Causes This? Towards Naive Physical Action-Effect Prediction", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2018"], ["Controllable Top-down Feature Transformer", "", "University of California, San Diego", "University of California, San Diego", "UCSD, 9500, Gilman Drive, Sixth College, University City, San Diego, San Diego County, California, 92093, USA", "32.87935255", "-117.23110049", "edu", "", "United States", "2017"], ["Natural Language Driven Image Edits using a Semantic Image Manipulation Language (SIMPL)", "", "Virginia Tech", "Virginia Tech", "Blacksburg, VA 24061, USA", "37.22838430", "-80.42341670", "edu", "", "United States", "2018"], ["The Impact of Visual Saliency Prediction in Image Classification", "", "Dublin City University", "DUBLIN CITY UNIVERSITY", "Dublin City University Glasnevin Campus, Lower Car Park, Wad, Whitehall A ED, Dublin 9, Dublin, County Dublin, Leinster, D09 FW22, Ireland", "53.38522185", "-6.25740874", "edu", "", "Ireland", "2017"], ["Oracle Performance for Visual Captioning", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "United States", "2016"], ["Linguistic Unit Discovery from Multi-Modal Inputs in Unwritten Languages: Summary of the \u201cSpeaking Rosetta\u201d JSALT 2017 Workshop", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2018"], ["Boosted Attention: Leveraging Human Attention for Image Captioning", "", "University of Minnesota", "University of Minnesota", "WeismanArt, 333, East River Parkway, Marcy-Holmes, Phillips, Minneapolis, Hennepin County, Minnesota, 55455, USA", "44.97308605", "-93.23708813", "edu", "", "United States", "2018"], ["Road Damage Detection And Classification In Smartphone Captured Images Using Mask R-CNN", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2018"], ["Fast Efficient Object Detection Using Selective Attention", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "Australia", "2018"], ["ScratchDet: Exploring to Train Single-Shot Object Detectors from Scratch", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["Design Pseudo Ground Truth with Motion Cue for Unsupervised Video Object Segmentation.", "", "National Taiwan University", "National Taiwan University", "\u81fa\u5927;\u53f0\u5927, 1, \u7f85\u65af\u798f\u8def\u56db\u6bb5, \u5b78\u5e9c\u91cc, \u5927\u5b89\u5340, \u81fa\u5317\u5e02, 10617, \u81fa\u7063", "25.01682835", "121.53846924", "edu", "", "Taiwan", "2018"], ["Partially-Supervised Image Captioning", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "Australia", "2018"], ["Rank of Experts: Detection Network Ensemble", "", "Electronics and Telecommunications Research Institute, Daejeon, South Korea", "Electronics and Telecommunications Research Institute, Daejeon, South Korea", "Electronics and Telecommunications Research Institute, Sinseong-dong, Daejeon, South Korea", "36.38376500", "127.36694000", "edu", "", "South Korea", "2017"], ["Emergent Translation in Multi-Agent Communication", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "United States", "2017"], ["Tag-based video retrieval by embedding semantic content in a continuous word space", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "Netherlands", "2016"], ["FastMask: Segment Multi-scale Object Candidates in One Shot", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "China", "2017"], ["Beyond Pixels: A Comprehensive Survey from Bottom-up to Semantic Image Segmentation and Cosegmentation", "", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "Singapore", "2016"], ["Looking at Hands in Autonomous Vehicles: A ConvNet Approach using Part Affinity Fields", "", "University of California, San Diego", "University of California, San Diego", "UCSD, 9500, Gilman Drive, Sixth College, University City, San Diego, San Diego County, California, 92093, USA", "32.87935255", "-117.23110049", "edu", "", "United States", "2018"], ["Learning visual attribute from image and text \u2217", "", "Tohoku University", "Tohoku University", "Tohoku University, \u4e94\u6a4b\u901a, \u9752\u8449\u533a, \u4ed9\u53f0\u5e02, \u5bae\u57ce\u770c, \u6771\u5317\u5730\u65b9, 980-0811, \u65e5\u672c", "38.25309450", "140.87365930", "edu", "", "Japan", "2015"], ["Adopting Abstract Images for Semantic Scene Understanding", "Microsoft Research, One Microsoft Way, Redmond, WA", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2016"], ["Indirect deep structured learning for 3D human body shape and pose prediction.", "", "University of Cambridge", "University of Cambridge", "Clifford Allbutt Lecture Theatre, Robinson Way, Romsey, Cambridge, Cambridgeshire, East of England, England, CB2 0QH, UK", "52.17638955", "0.14308882", "edu", "", "United Kingdom", "2017"], ["Tackling Low Resolution for Better Scene Understanding", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2018"], ["Add English to image Chinese captioning", "PDL, National Laboratory for Parallel and Distributed Processing, NUDT, National University of Defense Technology, Changsha, China", "National University of Defense Technology, China", "National University of Defence Technology, Changsha 410000, China", "\u56fd\u9632\u79d1\u5b66\u6280\u672f\u5927\u5b66, \u4e09\u4e00\u5927\u9053, \u5f00\u798f\u533a, \u5f00\u798f\u533a (Kaifu), \u957f\u6c99\u5e02 / Changsha, \u6e56\u5357\u7701, 410073, \u4e2d\u56fd", "28.22902090", "112.99483204", "mil", "", "China", "2017"], ["Deep Generative Models for Weakly-Supervised Multi-Label Classification", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Visual Question Answering : Datasets , Methods , Challenges and Oppurtunities", "", "Princeton University", "Princeton University", "Lot 9, University Place, Princeton Township, Mercer County, New Jersey, 08540, USA", "40.34829285", "-74.66308325", "edu", "", "United States", "2018"], ["Learning 3D Scene Synthesis from Annotated RGB-D Images", "", "Zhejiang University", "Zhejiang University", "\u6d59\u6c5f\u5927\u5b66\u4e4b\u6c5f\u6821\u533a, \u4e4b\u6c5f\u8def, \u8f6c\u5858\u8857\u9053, \u897f\u6e56\u533a (Xihu), \u676d\u5dde\u5e02 Hangzhou, \u6d59\u6c5f\u7701, 310008, \u4e2d\u56fd", "30.19331415", "120.11930822", "edu", "", "China", "2016"], ["Active Grounding of Visual Situations", "", "Santa Fe Institute", "Santa Fe Institute", "Santa Fe Institute, Hyde Park Road, Santa Fe, Santa Fe County, New Mexico, 87501, USA", "35.70028780", "-105.90864847", "edu", "", "United States", "2017"], ["A two-stage training deep neural network for small pedestrian detection", "Graduate School of Science and Engineering, Teikyo University", "Teikyo University", "Teikyo University", "Japan, \u3012173-8605 Tokyo, \u677f\u6a4b\u533a\u52a0\u8cc0\uff12\u4e01\u76ee\uff11\uff11\u2212\uff11", "35.75927460", "139.71450290", "edu", "", "Japan", "2017"], ["ABC-CNN: An Attention Based Convolutional Neural Network for Visual Question Answering", "", "University of Southern California", "University of Southern California", "University of Southern California, Watt Way, Saint James Park, LA, Los Angeles County, California, 90089, USA", "34.02241490", "-118.28634407", "edu", "", "United States", "2015"], ["A New Deep Learning-Based Food Recognition System for Dietary Assessment on An Edge Computing Service Infrastructure", "University of Massachusetts, Lowell, MA", "University of Massachusetts", "University of Massachusetts", "University of Massachusetts, Hicks Way, Amherst, Hampshire, Massachusetts, 01003, USA", "42.38897850", "-72.52869870", "edu", "", "United States", "2018"], ["Rethinking the Smaller-Norm-Less-Informative Assumption in Channel Pruning of Convolution Layers", "", "The Pennsylvania State University", "The Pennsylvania State University", "Old Main, State College, PA 16801, USA", "40.79821330", "-77.85990840", "edu", "", "United States", "2018"], ["Complex event processing for content-based text, image, and video retrieval", "United States Air Force Research Laboratory, Dayton, OH", "United States Air Force Research Laboratory, Dayton, OH", "United States Air Force Research Laboratory, Dayton, OH", "1864 4th St, Wright-Patterson AFB, OH 45433, USA", "39.79084110", "-84.09897580", "mil", "", "United States", "2016"], ["Non-parametric Structured Output Networks", "", "Disney Research", "Disney Research", "521 Circle 7 Dr, Glendale, CA 91201, USA", "34.15797420", "-118.28947290", "company", "", "United States", "2017"], ["A Rotation Invariant Latent Factor Model for Moveme Discovery from Static Poses", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "United States", "2016"], ["Bidirectional Long-Short Term Memory for Video Description", "", "University of Queensland", "University of Queensland", "University of Queensland, University Drive, Hill End, St Lucia, Brisbane, QLD, 4072, Australia", "-27.49741805", "153.01316956", "edu", "", "Australia", "2016"], ["Recurrent Topic-Transition GAN for Visual Paragraph Generation", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["Beyond Forward Shortcuts: Fully Convolutional Master-Slave Networks (MSNets) with Backward Skip Connections for Semantic Segmentation", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2017"], ["A Reinforcement Learning Framework for Natural Question Generation using Bi-discriminators", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "China", "2018"], ["VSE++: Improving Visual-Semantic Embeddings with Hard Negatives", "", "University of Toronto", "University of Toronto", "University of Toronto, St. George Street, Bloor Street Culture Corridor, Old Toronto, Toronto, Ontario, M5S 1A5, Canada", "43.66333345", "-79.39769975", "edu", "", "Canada", "2018"], ["NLE@MediaEval'17: Combining Cross-Media Similarity and Embeddings for Retrieving Diverse Social Images", "", "Naver Labs Europe, Meylan, France", "Naver Labs Europe, Meylan, France", "6 Chemin de Maupertuis, 38240 Meylan, France", "45.21739890", "5.79213490", "edu", "", "France", "2017"], ["Accelerating Machine Learning Inference with Probabilistic Predicates", "Princeton University &Microsoft, Princeton, NJ, USA", "Princeton University &Microsoft", "Princeton University &Microsoft, Princeton, NJ, USA", "Princeton, NJ 08544, USA", "40.34398880", "-74.65144810", "edu", "", "United States", "2018"], ["Actor-Critic Sequence Training for Image Captioning", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "United Kingdom", "2017"], ["Neural Image Captioning for Intelligent Vehicle-to-Passenger Communication", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2017"], ["Hybrid Supervised-unsupervised Image Topic Visualization with Convolutional Neural Network and LDA", "", "Indiana University", "Indiana University", "Indiana University East, West Cart Road, Richmond, Wayne County, Indiana, 47374, USA", "39.86948105", "-84.87956905", "edu", "", "United States", "2017"], ["Image captioning in Turkish with subword units", "Bilgisayar M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Hacettepe \u00dcniversitesi, Ankara, T\u00fcrkiye", "Bilgisayar M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Hacettepe \u00dcniversitesi, Ankara, T\u00fcrkiye", "Bilgisayar M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc, Hacettepe \u00dcniversitesi, Ankara, T\u00fcrkiye", "\u00dcniversiteler Mh., Hacettepe Beytepe Kamp\u00fcs\u00fc No:21, 06800 \u00c7ankaya/Ankara, Turkey", "39.87143010", "32.73636570", "edu", "", "Turkey", "2018"], ["Cross-linguistic differences and similarities in image descriptions", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "United Kingdom", "2017"], ["Comixify: Transform video into a comics", "", "Warsaw University of Technology", "Warsaw University of Technology", "Politechnika Warszawska, 1, Plac Politechniki, VIII, \u015ar\u00f3dmie\u015bcie, Warszawa, mazowieckie, 00-661, RP", "52.22165395", "21.00735776", "edu", "", "Poland", "2018"], ["Fine-grained Video Retrieval using Query Phrases \u2014 Waseda_Meisei TRECVID 2017 AVS System \u2014", "Faculty of Science and Engineering, Waseda University, Tokyo, 162-0042, Japan", "Waseda University", "Waseda University", "\u65e9\u7a32\u7530\u5927\u5b66 \u5317\u4e5d\u5dde\u30ad\u30e3\u30f3\u30d1\u30b9, 2-2, \u6709\u6bdb\u5f15\u91ce\u7dda, \u516b\u5e61\u897f\u533a, \u5317\u4e5d\u5dde\u5e02, \u798f\u5ca1\u770c, \u4e5d\u5dde\u5730\u65b9, 808-0135, \u65e5\u672c", "33.88987280", "130.70856205", "edu", "", "Japan", "2018"], ["DSOD: Learning Deeply Supervised Object Detectors from Scratch", "", "Fudan University", "Fudan University", "\u590d\u65e6\u5927\u5b66, 220, \u90af\u90f8\u8def, \u4e94\u89d2\u573a\u8857\u9053, \u6768\u6d66\u533a, \u4e0a\u6d77\u5e02, 200433, \u4e2d\u56fd", "31.30104395", "121.50045497", "edu", "", "China", "2017"], ["Exploiting Negative Evidence for Deep Latent Structured Models", "Sorbonne Universit\u00e9s, Paris, France", "CEDRIC-Conservatoire National des Arts et M\u00e9tiers, Paris, France", "CEDRIC-Conservatoire National des Arts et M\u00e9tiers, Paris, France", "32 Rue du Faubourg Saint-Martin, 75010 Paris, France", "48.87008750", "2.35638710", "edu", "", "France", "2018"], ["Detecting Animals in Infrared Images from Camera-Traps", "Research, MVTec Software GmbH, Munich, Germany", "Research, MVTec Software GmbH, Munich, Germany", "Research, MVTec Software GmbH, Munich, Germany", "Arnulfstra\u00dfe 205, 80634 M\u00fcnchen, Germany", "48.14952580", "11.52082560", "edu", "", "Germany", "2018"], ["PIRC Net : Using Proposal Indexing, Relationships and Context for Phrase Grounding", "", "University of Southern California", "University of Southern California", "University of Southern California, Watt Way, Saint James Park, LA, Los Angeles County, California, 90089, USA", "34.02241490", "-118.28634407", "edu", "", "United States", "2018"], ["Learning Unsupervised Visual Grounding Through Semantic Self-Supervision.", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Title Multi-Object Classification and Unsupervised Scene Understanding Using Deep Learning Features and Latent Tree Probabilistic Models Permalink", "", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2015"], ["Recurrent Pixel Embedding for Instance Grouping", "", "University of California, Irvine", "University of California, Irvine", "Irvine, CA 92697, USA", "33.64049520", "-117.84429620", "edu", "", "", "2018"], ["Distorting Neural Representations to Generate Highly Transferable Adversarial Examples", "", "Australian National University", "Australian National University", "Canberra ACT 0200, Australia", "-35.27769990", "149.11852700", "edu", "", "Australia", "2018"], ["Neural Motifs: Scene Graph Parsing with Global Context", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Artistic Image Generation from Sketch by Using Conditional Adversarial Network and Style Feature Transform", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "China", "2018"], ["C-WSL: Count-Guided Weakly Supervised Localization", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "United States", "2018"], ["Non-local RoI for Cross-Object Perception", "", "Academia Sinica, Taiwan", "Academia Sinica, Taiwan", "No. 128\u865f, Section 2, Academia Rd, Nangang District, Taipei City, Taiwan 11529", "25.04218520", "121.61454770", "edu", "", "Taiwan", "2018"], ["Learning from Multiview Correlations in Open-Domain Videos", "", "Imperial College London", "Imperial College London", "Imperial College London, Exhibition Road, Brompton, Royal Borough of Kensington and Chelsea, London, Greater London, England, SW7 2AZ, UK", "51.49887085", "-0.17560797", "edu", "", "United Kingdom", "2018"], ["Exploring the Design Space of Deep Convolutional Neural Networks at Large Scale", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2016"], ["BING++: A Fast High Quality Object Proposal Generator at 100fps", "", "Nankai University", "Nankai University", "94 Weijin Rd, Nankai Qu, China, 300071", "39.10394430", "117.17422320", "edu", "", "", "2015"], ["Actor-Action Semantic Segmentation with Region Masks", "", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "China", "2018"], ["Stability Based Filter Pruning for Accelerating Deep CNNs", "", "IIT Kanpur", "IIT Kanpur", "Kalyanpur, Kanpur, Uttar Pradesh 208016, India", "26.51233880", "80.23290000", "edu", "", "India", "2018"], ["4D Generic Video Object Proposals", "", "RWTH Aachen University", "RWTH Aachen University", "RWTH Aachen, Mies-van-der-Rohe-Stra\u00dfe, K\u00f6nigsh\u00fcgel, Aachen-Mitte, Aachen, St\u00e4dteregion Aachen, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 52074, Deutschland", "50.77917030", "6.06728733", "edu", "", "Germany", "2019"], ["Self-Supervised Adversarial Hashing Networks for Cross-Modal Retrieval", "", "University of Sydney", "University of Sydney", "USyd, Fisher Road, Camperdown, Sydney, NSW, 2006, Australia", "-33.88890695", "151.18943366", "edu", "", "Australia", "2018"], ["Active Transfer Learning with Zero-Shot Priors: Reusing Past Datasets for Future Tasks", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "Netherlands", "2015"], ["Question Part Relevance and Editing for Cooperative and Context-Aware VQA (C2VQA)", "Universit\u00e0 di Salerno, Dipartimento di Informatica, Fisciano, Italy", "Universit\u00e0 di Salerno, Dipartimento di Informatica, Fisciano, Italy", "Universit\u00e0 di Salerno, Dipartimento di Informatica, Fisciano, Italy", "Universit\u00e0 di Salerno Via Papa, Via Giovanni Paolo II, 132, 84084 Fisciano SA, Italy", "40.77434920", "14.78901500", "edu", "", "Italy", "2017"], ["Finding Tiny Faces", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["Multiview Cross-supervision for Semantic Segmentation", "", "University of Minnesota", "University of Minnesota", "WeismanArt, 333, East River Parkway, Marcy-Holmes, Phillips, Minneapolis, Hennepin County, Minnesota, 55455, USA", "44.97308605", "-93.23708813", "edu", "", "United States", "2018"], ["Asymmetric Deep Supervised Hashing", "", "Nanjing University", "Nanjing University", "NJU, \u4e09\u6c5f\u8def, \u9f13\u697c\u533a, \u5357\u4eac\u5e02, \u6c5f\u82cf\u7701, 210093, \u4e2d\u56fd", "32.05659570", "118.77408833", "edu", "", "China", "2018"], ["Simple Baseline for Visual Question Answering", "", "MIT", "Massachusetts Institute", "MIT, Amherst Street, Cambridgeport, Cambridge, Middlesex County, Massachusetts, 02238, USA", "42.35839610", "-71.09567788", "edu", "", "United States", "2015"], ["SPICE: Semantic Propositional Image Caption Evaluation", "", "Macquarie University", "Macquarie University, Sydney, Australia", "Balaclava Rd, Macquarie Park NSW 2109, Australia", "-33.77382370", "151.11264980", "edu", "", "Australia", "2016"], ["Image Captioning with Text-Based Visual Attention", "School of Electronics and Information Engineering, Sun Yat-sen University, Guangzhou, China", "Sun Yat-Sen University", "Sun Yat-Sen University", "\u4e2d\u5927, \u65b0\u6e2f\u897f\u8def, \u9f99\u8239\u6ed8, \u5eb7\u4e50, \u6d77\u73e0\u533a (Haizhu), \u5e7f\u5dde\u5e02, \u5e7f\u4e1c\u7701, 510105, \u4e2d\u56fd", "23.09461185", "113.28788994", "edu", "", "China", "2018"], ["CBAM: Convolutional Block Attention Module", "", "Adobe Research, San Jose, CA, USA", "Adobe Research, San Jose, CA, USA", "San Jose, CA, USA", "37.33820820", "-121.88632860", "edu", "", "United States", "2018"], ["Panoptic Segmentation with a Joint Semantic and Instance Segmentation Network", "", "TU Eindhoven", "TU Eindhoven", "Technische Universiteit Eindhoven, 2, De Rondom, Villapark, Eindhoven, Noord-Brabant, Nederland, 5600 MB, Nederland", "51.44866020", "5.49039957", "edu", "", "Netherlands", "2018"], ["Semantic soft segmentation", "MIT CSAIL and ETH Z\u00fcrich, Switzerland", "MIT CSAIL and ETH Z\u00fcrich, Switzerland", "MIT CSAIL and ETH Z\u00fcrich, Switzerland", "32 Vassar St, Cambridge, MA 02139, USA", "42.36194070", "-71.09043780", "edu", "", "United States", "2018"], ["Identifying implementation bugs in machine learning based image classifiers using metamorphic testing", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2018"], ["Semantic Segmentation , Urban Navigation , and Research Directions", "", "Princeton University", "Princeton University", "Lot 9, University Place, Princeton Township, Mercer County, New Jersey, 08540, USA", "40.34829285", "-74.66308325", "edu", "", "United States", "2018"], ["Implementation of human-robot VQA interaction system with dynamic memory networks", "School of Electrical Engineering, KAIST, Daejeon, Republic of Korea", "KAIST", "KAIST", "291 Daehak-ro, Eoeun-dong, Yuseong-gu, Daejeon, South Korea", "36.37214270", "127.36039000", "edu", "", "South Korea", "2017"], ["Adversarial Cross-Modal Retrieval", "University of Electronic Science and Technology of China, Chengdu, China", "University of Electronic Science and Technology of China", "University of Electronic Science and Technology of China", "Columbus, OH 43210, USA", "40.01419050", "-83.03091430", "edu", "", "United States", "2017"], ["Data Analysis Project : Using Knowledge Graphs for Image Classification", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Structure Inference Net: Object Detection Using Scene-Level Context and Instance-Level Relationships", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["Statistical Iterative CBCT Reconstruction Based on Neural Network", "Key Laboratory of Image Processing and Intelligent Control of Ministry of Education of China, Huazhong University of Science and Technology, Wuhan, China", "Huazhong University of Science and Technology", "Huazhong University of Science and Technology", "\u534e\u4e2d\u5927, \u73de\u55bb\u8def, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a, \u5173\u4e1c\u8857\u9053, \u4e1c\u6e56\u65b0\u6280\u672f\u5f00\u53d1\u533a\uff08\u6258\u7ba1\uff09, \u6d2a\u5c71\u533a (Hongshan), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430074, \u4e2d\u56fd", "30.50975370", "114.40628810", "edu", "", "China", "2018"], ["Fusion Scheme for Semantic and Instance-level Segmentation", "Computer Science Department, Technical University of Cluj-Napoca, Image Processing and Pattern Recognition Group, Romania", "Technical University of Cluj-Napoca", "Technical University of Cluj-Napoca", "Strada Memorandumului 28, Cluj-Napoca 400114, Romania", "46.76929900", "23.58561300", "edu", "", "Romania", "2018"], ["Where and Who? Automatic Semantic-Aware Person Composition", "", "University of Virginia", "University of Virginia", "University of Virginia, Rotunda Alley, Carr's Hill, Albemarle County, Virginia, 22904-4119, USA", "38.03536820", "-78.50353220", "edu", "", "United States", "2018"], ["Findings of the Second Shared Task on Multimodal Machine Translation and Multilingual Image Description", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "United Kingdom", "2017"], ["Learning to predict where to look in interactive environments using deep recurrent q-learning", "", "Iran", "Iran", "Iran", "32.42790800", "53.68804600", "edu", "", "Iran", "2016"], ["EmotioNet Challenge: Recognition of facial expressions of emotion in the wild", "", "Ohio State University", "The Ohio State University", "The Ohio State University, Woody Hayes Drive, Columbus, Franklin County, Ohio, 43210, USA", "40.00471095", "-83.02859368", "edu", "", "United States", "2017"], ["EMPIRICAL PERFORMANCE UPPER BOUNDS FOR IM- AGE AND VIDEO CAPTIONING", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "United States", "2016"], ["Automatic Annotation of Object Instances by Region-Based Recurrent Neural Networks", "Faculty of Electronics, Telecommunications and Information Technology, University Politehnica of Bucharest, Bucharest, 061071, Romania", "University Politehnica of Bucharest", "University Politehnica of Bucharest", "Universitatea Politehnica din Bucure\u0219ti, Novum Invest, Bucure\u0219ti, Militari, Sector 6, Municipiul Bucure\u0219ti, 060042, Rom\u00e2nia", "44.43918115", "26.05044565", "edu", "", "Romania", "2018"], ["Perceptual Material Attributes Arise in Local Material Recognition", "", "Drexel University", "Drexel University", "Drexel University, Arch Street, Powelton Village, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.95740000", "-75.19026706", "edu", "", "United States", "2016"], ["Hierarchical Co-Attention for Visual Question Answering", "", "Virginia Tech", "Virginia Tech", "Blacksburg, VA 24061, USA", "37.22838430", "-80.42341670", "edu", "", "United States", "2016"], ["Intelligent Film Assistant for Personalized Video Creation on Mobile Devices", "University of Applied Sciences, Technikum Wien, Vienna, Austria", "University of Applied Sciences", "National Kaohsiung, University of Applied Sciences, Kaohsiung, Taiwan. jspan@cc.kuas.edu.tw", "No. 415\u865f, Jiangong Road, Sanmin District, Kaohsiung City, Taiwan 807", "22.64894580", "120.32831570", "edu", "", "Taiwan", "2017"], ["Crowd Counting via Scale-Adaptive Convolutional Neural Network", "", "Shanghai Jiaotong University", "Shanghai Jiaotong University", "China, Shanghai, Minhang, \u4e1c\u5ddd\u8def \u90ae\u653f\u7f16\u7801: 200240", "31.02522010", "121.43377840", "edu", "", "China", "2018"], ["Action Machine: Rethinking Action Recognition in Trimmed Videos", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["S4Net: Single Stage Salient-Instance Segmentation", "", "Nankai University", "Nankai University", "94 Weijin Rd, Nankai Qu, China, 300071", "39.10394430", "117.17422320", "edu", "", "", "2017"], ["Answerer in Questioner's Mind for Goal-Oriented Visual Dialogue", "", "Seoul National University", "Seoul National University", "\uc11c\uc6b8\ub300\ud559\uad50, \uc11c\ud638\ub3d9\ub85c, \uc11c\ub454\ub3d9, \uad8c\uc120\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16614, \ub300\ud55c\ubbfc\uad6d", "37.26728000", "126.98411510", "edu", "", "South Korea", "2017"], ["Beyond Manual Annotations for Learning Visual Representations", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2016"], ["Deep Neural Networks for Semantic Segmentation of Multispectral Remote Sensing Imagery", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "United States", "2017"], ["Best of Both Worlds: Transferring Knowledge from Discriminative Learning to a Generative Visual Dialog Model", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2017"], ["A vision-grounded dataset for predicting typical locations for verbs", "", "University of California at Berkeley", "International Computer Science Institute, University of California at Berkeley, Berkeley, USA", "1947 Center St, Berkeley, CA 94704, USA", "37.87015430", "-122.27123120", "edu", "", "United States", "2018"], ["Leveraging Motion Priors in Videos for Improving Human Segmentation", "", "National Tsing Hua University", "National Tsing Hua University", "\u570b\u7acb\u6e05\u83ef\u5927\u5b78, 101, \u514b\u606d\u6a4b, \u5149\u660e\u91cc, \u8d64\u571f\u5d0e, \u6771\u5340, \u65b0\u7af9\u5e02, 30013, \u81fa\u7063", "24.79254840", "120.99511830", "edu", "", "Taiwan", "2018"], ["Shape and Pose Estimation for Closely Interacting Persons Using Multi-view Images", "", "Tianjin University", "Tianjin University", "\u6cf0\u5c71\u822a\u7a7a\u6e2f/\u5929\u6d25\u5927\u53a6, \u67a3\u884c\u8def, \u67a3\u884c \u9ad8\u738b\u5bfa, \u957f\u57ce\u8def, \u5927\u6cb3, \u5cb1\u5cb3\u533a (Daiyue), \u6cf0\u5b89\u5e02, \u5c71\u4e1c\u7701, 271000, \u4e2d\u56fd", "36.20304395", "117.05842113", "edu", "", "China", "2018"], ["Quantization and Training of Neural Networks for Efficient Integer-Arithmetic-Only Inference", "", "Google", "Google, Inc.", "1600 Amphitheatre Pkwy, Mountain View, CA 94043, USA", "37.42199990", "-122.08405750", "company", "Google, Mountain View, CA", "United States", "2018"], ["Gibson Env: Real-World Perception for Embodied Agents", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2018"], ["Explaining the Ambiguity of Object Detection and 6D Pose from Visual Data", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2018"], ["AutoFocus: Efficient Multi-Scale Inference", "", "University of Maryland", "University of Maryland", "The Grand Garage, 5, North Paca Street, Seton Hill, Baltimore, Maryland, 21201, USA", "39.28996850", "-76.62196103", "edu", "", "United States", "2018"], ["Large-Scale Active Learning with Approximations of Expected Model Output Changes", "", "Friedrich Schiller University Jena", "Computer Vision Group, Friedrich Schiller University Jena, Germany", "Ernst-Abbe-Platz 2, 07743 Jena, Germany", "50.92776710", "11.58217290", "edu", "", "Germany", "2016"], ["Multi-modal deep feature learning for RGB-D object detection", "", "University of Rochester", "University of Rochester", "Memorial Art Gallery, 500, University Avenue, East End, Rochester, Monroe County, New York, 14607, USA", "43.15769690", "-77.58829158", "edu", "", "United States", "2017"], ["Beyond Grids : Learning Graph Representations for Visual Recognition", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["ALFA: Agglomerative Late Fusion Algorithm for Object Detection", "Institute of Computational Mathematics and Information Technologies, Kazan Federal University, Russia", "Czech Technical University", "Czech Technical University", "\u010cesk\u00e9 vysok\u00e9 u\u010den\u00ed technick\u00e9 v Praze, Resslova, Nov\u00e9 M\u011bsto, Praha, okres Hlavn\u00ed m\u011bsto Praha, Hlavn\u00ed m\u011bsto Praha, Praha, 11121, \u010cesko", "50.07642960", "14.41802312", "edu", "", "Czech Republic", "2018"], ["Question Type Guided Attention in Visual Question Answering", "", "California Institute of Technology", "California Institute of Technology", "California Institute of Technology, San Pasqual Walk, Madison Heights, Pasadena, Los Angeles County, California, 91126, USA", "34.13710185", "-118.12527487", "edu", "", "United States", "2018"], ["Unsupervised Domain Adaptation for Semantic Segmentation with GANs", "", "GE Global Research Center", "GE Global Research Center", "GE Global Research Center, Aqueduct, Niskayuna, Schenectady County, New York, USA", "42.82982480", "-73.87719385", "edu", "", "United States", "2017"], ["Unsupervised Ensemble Regression", "", "IBM Thomas J. Watson Research Center", "IBM Thomas J. Watson Research Center", "IBM Yorktown research lab, Adams Road, Millwood, Town of New Castle, Westchester County, New York, 10562, USA", "41.21002475", "-73.80407056", "company", "", "United States", "2017"], ["Dockerface: an easy to install and use Faster R-CNN face detector in a Docker container", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2017"], ["Integrating Local Material Recognition with Large-Scale Perceptual Attribute Discovery", "", "Drexel University", "Drexel University", "Drexel University, Arch Street, Powelton Village, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.95740000", "-75.19026706", "edu", "", "United States", "2016"], ["Approximate Distribution Matching for Sequence-to-Sequence Learning", "", "Microsoft Research Asia", "Microsoft Research Asia", "1 Memorial Dr, Cambridge, MA 02142, USA", "42.36142560", "-71.08120920", "company", "", "United States", "2018"], ["Webly Supervised Learning of Convolutional Networks", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2015"], ["Action-driven 3D indoor scene evolution", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2016"], ["Pedestrian Detection by Feature Selected Self-Similarity Features", "National Key Laboratory of Science and Technology on Communications, University of Electronic Science and Technology of China, Chengdu, China", "University of Electronic Science and Technology of China", "University of Electronic Science and Technology of China", "Columbus, OH 43210, USA", "40.01419050", "-83.03091430", "edu", "", "United States", "2018"], ["Multiple Instance Learning Convolutional Neural Networks for object recognition", "", "University of Missouri", "University of Missouri", "L1, Maguire Boulevard, Lemone Industrial Park, Columbia, Boone County, Missouri, 65201, USA", "38.92676100", "-92.29193783", "edu", "", "United States", "2016"], ["Amodal Instance Segmentation", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2016"], ["Dictionary-Guided Editing Networks for Paraphrase Generation", "", "Beihang University", "Beihang University", "\u5317\u4eac\u822a\u7a7a\u822a\u5929\u5927\u5b66, 37, \u5b66\u9662\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100083, \u4e2d\u56fd", "39.98083330", "116.34101249", "edu", "", "China", "2018"], ["Improving Image Captioning by Leveraging Knowledge Graphs", "", "The Pennsylvania State University", "The Pennsylvania State University", "Old Main, State College, PA 16801, USA", "40.79821330", "-77.85990840", "edu", "", "United States", "2019"], ["Ex Paucis Plura : Learning Affordance Segmentation from Very Few Examples", "", "University of Bonn", "University of Bonn", "Rheinische Friedrich-Wilhelms-Universit\u00e4t Bonn, Arkadenhof, Bonn-Zentrum, Stadtbezirk Bonn, Bonn, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 53113, Deutschland", "50.73381240", "7.10224650", "edu", "", "Germany", "2018"], ["Story Understanding in Video Advertisements", "", "University of Pittsburgh", "University of Pittsburgh", "University of Pittsburgh, Sutherland Drive, West Oakland, PGH, Allegheny County, Pennsylvania, 15240, USA", "40.44415295", "-79.96243993", "edu", "", "United States", "2018"], ["Prototype GOD: prototype Generic Objects Dataset for an Object Detection System based on Bird\u2019s \u2013Eye View", "Visual Intelligence Research Group Electronics and Telecommunications Research Institute, Daejeon, Korea", "Electronics and Telecommunications Research Institute, Korea", "Electronics and Telecommunications Research Institute (ETRI), Republic of Korea", "South Korea", "35.90775700", "127.76692200", "edu", "", "South Korea", "2018"], ["A Multi-Stream Convolutional Neural Network Framework for Group Activity Recognition", "", "Iran", "Iran", "Iran", "32.42790800", "53.68804600", "edu", "", "Iran", "2018"], ["Peephole: Predicting Network Performance Before Training", "", "Chinese University of Hong Kong", "Chinese University of Hong Kong", "Hong Kong, \u99ac\u6599\u6c34\u6c60\u65c1\u8def", "22.41626320", "114.21093180", "edu", "", "China", "2017"], ["AutoMarkov DNNs for object classification", "University Politehnica of Bucharest, Faculty of Electronics, Telecommunications and Information Technology, Applied Electronics and Information Engineering Department, 1-3, Iuliu Maniu Ave., Romania 061071", "University Politehnica of Bucharest", "University Politehnica of Bucharest", "Universitatea Politehnica din Bucure\u0219ti, Novum Invest, Bucure\u0219ti, Militari, Sector 6, Municipiul Bucure\u0219ti, 060042, Rom\u00e2nia", "44.43918115", "26.05044565", "edu", "", "Romania", "2016"], ["Aggregated Residual Transformations for Deep Neural Networks", "", "UC San Diego", "UC San Diego", "9500 Gilman Dr, La Jolla, CA 92093, USA", "32.88006040", "-117.23401350", "edu", "", "United States", "2017"], ["Looking deeper and transferring attention for image captioning", "Shanghai Engineering Research Center of Industrial Vision Perception & Intelligent Computing, Shanghai, China", "Shanghai Engineering Research Center of Industrial Vision Perception & Intelligent Computing, Shanghai, China", "Shanghai Engineering Research Center of Industrial Vision Perception & Intelligent Computing, Shanghai, China", "Shanghai, China", "31.23039040", "121.47370210", "edu", "", "China", "2018"], ["Evaluating ResNeXt Model Architecture for Image Classification", "", "University of Waterloo", "University of Waterloo", "University of Waterloo, 200, University Avenue West, Northdale, Beechwood, Waterloo, Regional Municipality of Waterloo, Ontario, N2L 3G1, Canada", "43.47061295", "-80.54724732", "edu", "", "Canada", "2018"], ["Robot Classification of Human Interruptibility and a Study of Its Effects", "Georgia Institute of Technology, Atlanta, GA", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2018"], ["Fake Sentence Detection as a Training Task for Sentence Encoding", "", "Stony Brook University", "Stony Brook University", "Stony Brook University, 100, Nicolls Road, Stony Brook, Suffolk County, New York, 11794, USA", "40.91531960", "-73.12706260", "edu", "", "United States", "2018"], ["Decoupled Novel Object Captioner", "", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "China", "2018"], ["ScratchDet : Training Single-Shot Object Detectors from Scratch", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["The Emotional Impact of Audio-Visual Stimuli", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "United States", "2018"], ["Question action relevance and editing for visual question answering", "Dipartimento di Informatica, Universit\u00e0 di Salerno, Fisciano, Italy", "Dipartimento di Informatica, Universit\u00e0 di Salerno, Fisciano, Italy", "Dipartimento di Informatica, Universit\u00e0 di Salerno, Fisciano, Italy", "Universit\u00e0 di Salerno Via Papa, Via Giovanni Paolo II, 132, 84084 Fisciano SA, Italy", "40.77434920", "14.78901500", "edu", "", "Italy", "2018"], ["Cross Modal Distillation for Supervision Transfer", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2016"], ["Hot Anchors: A Heuristic Anchors Sampling Method in RCNN-Based Object Detection", "", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences", "University of Chinese Academy of Sciences, UCAS, Yuquanlu, \u7389\u6cc9\u8def, \u7530\u6751, \u6d77\u6dc0\u533a, 100049, \u4e2d\u56fd", "39.90828040", "116.24585270", "edu", "", "China", "2018"], ["HiDDeN: Hiding Data With Deep Networks", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2018"], ["Spatial-Aware Object Embeddings for Zero-Shot Localization and Classification of Actions", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "Netherlands", "2017"], ["Subitizing with Variational Autoencoders", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "Netherlands", "2018"], ["PoseTrack: Joint Multi-person Pose Estimation and Tracking", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2017"], ["Fast, Diverse and Accurate Image Captioning Guided By Part-of-Speech", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2018"], ["Answer-Type Prediction for Visual Question Answering", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "United States", "2016"], ["Semantic Image Segmentation via Deep Parsing Network", "", "Chinese University of Hong Kong", "Chinese University of Hong Kong", "Hong Kong, \u99ac\u6599\u6c34\u6c60\u65c1\u8def", "22.41626320", "114.21093180", "edu", "", "China", "2015"], ["Bird Species Classification using Transfer Learning with Multistage Training", "", "India", "India", "India", "20.59368400", "78.96288000", "edu", "", "", "2018"], ["Traits & Transferability of Adversarial Examples against Instance Segmentation & Object Detection", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2018"], ["Hierarchical Recurrent Neural Encoder for Video Representation with Application to Captioning", "", "University of Technology Sydney", "University of Technology Sydney", "University of Technology Sydney, Omnibus Lane, Ultimo, Sydney, NSW, 2007, Australia", "-33.88096510", "151.20107299", "edu", "", "Australia", "2016"], ["Self-Contained Stylization via Steganography for Reverse and Serial Style Transfer", "", "National Chiao Tung University", "National Chiao Tung University", "NCTU;\u4ea4\u5927;\u4ea4\u901a\u5927\u5b78;\u4ea4\u5927\u5149\u5fa9\u6821\u5340;\u4ea4\u901a\u5927\u5b78\u5149\u5fa9\u6821\u5340, 1001, \u5927\u5b78\u8def, \u5149\u660e\u91cc, \u8d64\u571f\u5d0e, \u6771\u5340, \u65b0\u7af9\u5e02, 30010, \u81fa\u7063", "24.78676765", "120.99724412", "edu", "", "Taiwan", "2018"], ["Improving Fast Segmentation With Teacher-Student Learning", "", "Nanyang Technological University", "Nanyang Technological University", "NTU, Faculty Avenue, Jurong West, Southwest, 637460, Singapore", "1.34841040", "103.68297965", "edu", "", "Singapore", "2018"], ["Describing Natural Images Containing Novel Objects with Knowledge Guided Assitance", "", "Karlsruhe Institute of Technology", "Karlsruhe Institute of Technology", "KIT, Leopoldshafener Allee, Linkenheim, Linkenheim-Hochstetten, Landkreis Karlsruhe, Regierungsbezirk Karlsruhe, Baden-W\u00fcrttemberg, 76351, Deutschland", "49.10184375", "8.43312560", "edu", "", "Germany", "2017"], ["Do deep features retrieve X ? : A tool for quick inspection of deep visual similarities", "", "University of British Columbia", "University of British Columbia", "University of British Columbia, Eagles Drive, Hawthorn Place, University Endowment Lands, Metro Vancouver, British Columbia, V6T, Canada", "49.25839375", "-123.24658161", "edu", "", "Canada", "2015"], ["The Middle Child Problem: Revisiting Parametric Min-Cut and Seeds for Object Proposals", "", "Oregon State University", "Oregon State University", "OSU Beaver Store, 538, Southwest 6th Avenue, Portland Downtown, Portland, Multnomah County, Oregon, 97204, USA", "45.51982890", "-122.67797964", "edu", "", "United States", "2015"], ["The Unreasonable Effectiveness of Noisy Data for Fine-Grained Recognition", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2016"], ["Traffic-Sign Detection and Classification in the Wild", "", "Beijing, China", "Beijing, China", "Beijing, China", "39.90419990", "116.40739630", "edu", "", "China", "2016"], ["Progressively Diffused Networks for Semantic Image Segmentation", "", "SenseTime", "SenseTime", "China, Beijing Shi, Haidian Qu, WuDaoKou, Zhongguancun E Rd, 1\u53f7-7", "39.99300800", "116.32988200", "company", "1 Zhongguancun E Rd, Haidian Qu, China", "China", "2017"], ["Subspace Alignment Based Domain Adaptation for RCNN Detector", "", "IIT Kanpur", "IIT Kanpur", "Kalyanpur, Kanpur, Uttar Pradesh 208016, India", "26.51233880", "80.23290000", "edu", "", "India", "2015"], ["Segment-Phrase Table for Semantic Segmentation, Visual Entailment and Paraphrasing", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "United States", "2015"], ["Towards High Performance Video Object Detection for Mobiles", "", "Microsoft Research Asia", "Microsoft Research Asia", "1 Memorial Dr, Cambridge, MA 02142, USA", "42.36142560", "-71.08120920", "company", "", "United States", "2018"], ["Loss Functions for Multiset Prediction", "", "New York University", "New York University", "NYU, West 4th Street, NoHo Historic District, NoHo, Manhattan, Manhattan Community Board 2, New York County, NYC, New York, 10012, USA", "40.72925325", "-73.99625394", "edu", "", "United States", "2018"], ["Fast Online Object Tracking and Segmentation: A Unifying Approach", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2018"], ["Looking for ELMo's friends: Sentence-Level Pretraining Beyond Language Modeling.", "", "Johns Hopkins University", "Johns Hopkins University", "Baltimore, MD 21218, USA", "39.32990130", "-76.62051770", "edu", "", "", "2018"], ["Transferable Semi-Supervised Semantic Segmentation", "", "Beckman Institute", "Beckman Institute", "Beckman Institute, The Presidents' Walk, Urbana, Champaign County, Illinois, 61801-2341, USA", "40.11571585", "-88.22750772", "edu", "", "United States", "2018"], ["Multi-modal Capsule Routing for Actor and Action Video Segmentation Conditioned on Natural Language Queries", "", "University of Central Florida", "University of Central Florida", "University of Central Florida, Libra Drive, University Park, Orange County, Florida, 32816, USA", "28.59899755", "-81.19712501", "edu", "", "United States", "2018"], ["Enhancement of SSD by concatenating feature maps for object detection.", "", "Seoul National University", "Seoul National University", "\uc11c\uc6b8\ub300\ud559\uad50, \uc11c\ud638\ub3d9\ub85c, \uc11c\ub454\ub3d9, \uad8c\uc120\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16614, \ub300\ud55c\ubbfc\uad6d", "37.26728000", "126.98411510", "edu", "", "South Korea", "2017"], ["Generation with Recursive Neural Networks", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2016"], ["Active learning and discovery of object categories in the presence of unnameable instances", "Computer Vision Group, Friedrich Schiller University Jena, Germany", "Friedrich Schiller University Jena", "Computer Vision Group, Friedrich Schiller University Jena, Germany", "Ernst-Abbe-Platz 2, 07743 Jena, Germany", "50.92776710", "11.58217290", "edu", "", "Germany", "2015"], ["Ambiguity Helps: Classification with Disagreements in Crowdsourced Annotations", "", "Harvard University", "Harvard University", "Harvard University, Soldiers Field Road, Allston, Boston, Suffolk County, Massachusetts, 02163, USA", "42.36782045", "-71.12666653", "edu", "", "United States", "2016"], ["Spott: On-the-Spot e-Commerce for Television Using Deep Learning-Based Video Analysis Techniques", "Ghent University - imec, ELIS - IDLab, Pietersnieuwstraat, Ghent", "Ghent University", "Ghent University", "St. Pietersnieuwstraat 33, 9000 Gent, Belgium", "51.04656190", "3.72791810", "edu", "", "Belgium", "2017"], ["Improving Multi-Person Pose Estimation using Label Correction", "", "Keio University", "Keio University", "\u7db1\u5cf6\u5e02\u6c11\u306e\u68ee, \u3051\u3064\u308f\u308a\u5742, \u6e2f\u5317\u533a, \u6a2a\u6d5c\u5e02, \u795e\u5948\u5ddd\u770c, \u95a2\u6771\u5730\u65b9, 223-0053, \u65e5\u672c", "35.54169690", "139.63471840", "edu", "", "Japan", "2018"], ["A Focused Dynamic Attention Model for Visual Question Answering", "", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "Singapore", "2016"], ["Solving Visual Madlibs with Multiple Cues", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2016"], ["Could we create a training set for image captioning using automatic translation?", "Bilgisayar Mühendisliği, Orta Doggu Teknik Üniversitesi, Ankara, Türkiye", "Bilgisayar M\u00fchendisli\u011fi, Orta Doggu Teknik \u00dcniversitesi, Ankara, T\u00fcrkiye", "Bilgisayar Mühendisliği, Orta Doggu Teknik Üniversitesi, Ankara, Türkiye", "\u00dcniversiteler Mh., 06800 \u00c7ankaya/Ankara, Turkey", "39.89183900", "32.78334710", "edu", "", "Poland", "2017"], ["Unprecedented Usage of Pre-trained CNNs on Beauty Product", "University of Malaya, Kuala Lumpur, Malaysia", "University of Malaya", "University of Malaya", "UM, Lingkaran Wawasan, Bukit Pantai, Bangsar, KL, 50603, Malaysia", "3.12267405", "101.65356103", "edu", "", "Malaysia", "2018"], ["Improved Image Captioning via Policy Gradient optimization of SPIDEr", "", "University of Oxford", "University of Oxford", "Radcliffe Camera, Radcliffe Square, Grandpont, Oxford, Oxon, South East, England, OX1 4AJ, UK", "51.75345380", "-1.25400997", "edu", "", "United Kingdom", "2017"], ["High performance and fast object detection in road environments", "DGIST", "DGIST", "DGIST", "South Korea, Daegu, Dalseong-gun, Yuga-myeon, \ud14c\ud06c\ub178\uc911\uc559\ub300\ub85c 333", "35.70528600", "128.45710200", "edu", "", "South Korea", "2017"], ["Object Recognition Based on Amounts of Unlabeled Data", "", "Beijing Institute of Technology", "Beijing Institute of Technology University", "\u5317\u4eac\u7406\u5de5\u5927\u5b66, 5, \u4e2d\u5173\u6751\u5357\u5927\u8857, \u4e2d\u5173\u6751, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100872, \u4e2d\u56fd", "39.95866520", "116.30971281", "edu", "", "China", "2016"], ["Multi-Label Music Genre Classification from Audio, Text and Images Using Deep Features", "", "Universitat Pompeu Fabra", "Universitat Pompeu Fabra", "Dip\u00f2sit de les Aig\u00fces, Carrer de Wellington, la Vila Ol\u00edmpica del Poblenou, Ciutat Vella, Barcelona, BCN, CAT, 08071, Espa\u00f1a", "41.39044285", "2.18891949", "edu", "", "Spain", "2017"], ["Zero-Shot Detection", "", "Boston University", "Boston University", "BU, Bay State Road, Fenway, Boston, Suffolk County, Massachusetts, 02215, USA", "42.35042530", "-71.10056114", "edu", "", "United States", "2018"], ["What are the Visual Features Underlying Human Versus Machine Vision?", "", "Brown University", "Brown University", "Brown University, Waterman Street, College Hill, Providence, Bristol, Rhode Island, 02912, USA", "41.82686820", "-71.40123146", "edu", "", "United States", "2017"], ["Material Recognition from Local Appearance in Global Context", "", "Drexel University", "Drexel University", "Drexel University, Arch Street, Powelton Village, Philadelphia, Philadelphia County, Pennsylvania, 19104, USA", "39.95740000", "-75.19026706", "edu", "", "United States", "2016"], ["Complex Object Classification: A Multi-Modal Multi-Instance Multi-Label Deep Network with Optimal Transport", "Nanjing University, Nanjing, China", "Nanjing University", "Nanjing University", "NJU, \u4e09\u6c5f\u8def, \u9f13\u697c\u533a, \u5357\u4eac\u5e02, \u6c5f\u82cf\u7701, 210093, \u4e2d\u56fd", "32.05659570", "118.77408833", "edu", "", "China", "2018"], ["What's the point: Semantic segmentation with point supervision", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "United Kingdom", "2016"], ["Extreme Clicking for Efficient Object Annotation", "", "University of Edinburgh", "University of Edinburgh", "New College, New College Courtyard, The Mound, Old Town, Edinburgh, City of Edinburgh, Scotland, EH1 2LX, UK", "55.94951105", "-3.19534913", "edu", "", "United Kingdom", "2017"], ["Visual Question Answering with Memory-Augmented Networks", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2018"], ["Data Augmentation for Cnn-Based People Detection in Aerial Images", "Department of Information Engineering and Computer Science, Feng Chia University, Taiwan", "Feng Chia University", "Feng Chia University", "\u9022\u7532\u5927\u5b78, 100, \u6587\u83ef\u8def, \u897f\u5e73\u91cc, \u897f\u5c6f\u5340, \u81fa\u4e2d\u5e02, 40724, \u81fa\u7063", "24.18005755", "120.64836072", "edu", "", "Taiwan", "2018"], ["Deep correlation for matching images and text", "Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, United Kingdom, GU2 7XH", "University of Surrey", "University of Surrey", "University of Surrey, Spine Road, Guildford Park, Guildford, Surrey, South East, England, GU2 7XH, UK", "51.24303255", "-0.59001382", "edu", "", "United Kingdom", "2015"], ["Recurrent Models for Situation Recognition", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2017"], ["Deep Attribute-preserving Metric Learning for Natural Language Object Retrieval", "National University of Singapore, Singapore, Singapore", "National University of Singapore", "National University of Singapore", "NUS, Former 1936 British Outpost, Nepal Hill, Clementi, Southwest, 117542, Singapore", "1.29620180", "103.77689944", "edu", "", "Singapore", "2017"], ["Using Syntax to Ground Referring Expressions in Natural Images", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["GANtruth - an unpaired image-to-image translation method for driving scenarios", "", "KTH Royal Institute of Technology, Stockholm", "KTH Royal Institute of Technology, Stockholm", "KTH, Teknikringen, L\u00e4rkstaden, Norra Djurg\u00e5rden, \u00d6stermalms stadsdelsomr\u00e5de, Sthlm, Stockholm, Stockholms l\u00e4n, Svealand, 114 28, Sverige", "59.34986645", "18.07063213", "edu", "", "Sweden", "2018"], ["Revisiting Pre-training: An Efficient Training Method for Image Classification", "", "Beckman Institute", "Beckman Institute", "Beckman Institute, The Presidents' Walk, Urbana, Champaign County, Illinois, 61801-2341, USA", "40.11571585", "-88.22750772", "edu", "", "United States", "2018"], ["Evaluation of Segmentation Quality via Adaptive Composition of Reference Segmentations", "School of Engineering, University of California, Merced, CA", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2017"], ["Semantic Segmentation With Object Clique Potentials", "", "Chinese University of Hong Kong", "Chinese University of Hong Kong", "Hong Kong, \u99ac\u6599\u6c34\u6c60\u65c1\u8def", "22.41626320", "114.21093180", "edu", "", "China", "2015"], ["Neural Module Networks", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2016"], ["ImagineNet : Style Transfer from Fine Art to Graphical User Interfaces", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", "2018"], ["Investigating the feature collection for semantic segmentation via single skip connection", "", "Ajou University", "Ajou University", "\uc544\uc8fc\ub300\ud559\uad50, \uc131\ud638\ub300\uad50, \uc774\uc758\ub3d9, \uc601\ud1b5\uad6c, \uc218\uc6d0\uc2dc, \uacbd\uae30, 16499, \ub300\ud55c\ubbfc\uad6d", "37.28300030", "127.04548469", "edu", "", "Korea", "2017"], ["Understanding and Controlling User Linkability in Decentralized Learning", "", "Max Planck Institute for Informatics", "Max Planck Institute for Informatics", "MPII, E1 4, Campus, Universit\u00e4t, Sankt Johann, Bezirk Mitte, Saarbr\u00fccken, Regionalverband Saarbr\u00fccken, Saarland, 66123, Deutschland", "49.25795660", "7.04577417", "edu", "", "Germany", "2018"], ["PolyMapper: Extracting City Maps using Polygons", "", "ETH Z\u00fcrich", "ETH Z\u00fcrich", "ETH Z\u00fcrich, 101, R\u00e4mistrasse, Hochschulen, Altstadt, Z\u00fcrich, Bezirk Z\u00fcrich, Z\u00fcrich, 8092, Schweiz/Suisse/Svizzera/Svizra", "47.37645340", "8.54770931", "edu", "", "Switzerland", "2018"], ["Weakly and Semi Supervised Human Body Part Parsing via Pose-Guided Knowledge Transfer", "", "University of California", "University of California", "Berkeley, CA, USA", "37.87189920", "-122.25853990", "edu", "", "United States", "2018"], ["A Fast Multi-Task CNN for Spatial Understanding of Traffic Scenes", "Institute of Control Theory and Systems Engineering, TU Dortmund University, Otto-Hahn-Str. 8, Dortmund, 44227, Germany", "TU Dortmund University", "Institute of Control Theory and Systems Engineering, TU Dortmund University, Otto-Hahn-Str. 8, Dortmund, 44227, Germany", "Emil-Figge-Stra\u00dfe 50, 44227 Dortmund, Germany", "51.49219020", "7.41413620", "edu", "", "Germany", "2018"], ["Resolving References to Objects in Photographs using the Words-As-Classifiers Model", "", "Bielefeld University", "Bielefeld University", "Fachhochschule Bielefeld FB Gestaltung, 3, Lampingstra\u00dfe, Mitte, Bielefeld, Regierungsbezirk Detmold, Nordrhein-Westfalen, 33615, Deutschland", "52.02804210", "8.51148270", "edu", "", "Germany", "2016"], ["Image Captioning with Word Level Attention", "Department of Computer Science & Technology, Tongji University, Shanghai, P. R. China", "Tongji University", "Tongji University", "\u540c\u6d4e\u5927\u5b66, 1239, \u56db\u5e73\u8def, \u6c5f\u6e7e, \u8679\u53e3\u533a, \u4e0a\u6d77\u5e02, 200092, \u4e2d\u56fd", "31.28473925", "121.49694909", "edu", "", "China", "2018"], ["Class Rectification Hard Mining for Imbalanced Deep Learning", "", "Queen Mary University of London", "Queen Mary University of London", "Queen Mary (University of London), Mile End Road, Globe Town, Mile End, London Borough of Tower Hamlets, London, Greater London, England, E1 4NS, UK", "51.52472720", "-0.03931035", "edu", "", "United Kingdom", "2017"], ["Learning deep structured network for weakly supervised change detection", "", "University of Western Australia", "University of Western Australia", "UWA, 35, Underwood Avenue, Daglish, Perth, Western Australia, 6009, Australia", "-31.95040445", "115.79790037", "edu", "", "Australia", "2017"], ["Towards semantic visual representation: augmenting image representation with natural language descriptors", "Indian Institute of Science, Bangalore, India", "Indian Institute of Science Bangalore", "Indian Institute of Science Bangalore", "IISc, Gulmohar Marg, RMV Stage II - 1st Block, Aramane Nagara Ward, West Zone, Bengaluru, Bangalore Urban, Karnataka, 560012, India", "13.02223470", "77.56718325", "edu", "", "India", "2016"], ["Sequence to Sequence -- Video to Text", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2015"], ["Efficient Coarse-to-Fine Non-Local Module for the Detection of Small Objects.", "", "Weizmann Institute of Science", "Weizmann Institute of Science", "\u05de\u05db\u05d5\u05df \u05d5\u05d9\u05e6\u05de\u05df \u05dc\u05de\u05d3\u05e2, \u05e9\u05d3\u05e8\u05ea \u05de\u05e8\u05db\u05d5\u05e1 \u05d6\u05d9\u05d5, \u05de\u05e2\u05d5\u05e0\u05d5\u05ea \u05e9\u05d9\u05d9\u05df, \u05d0\u05d7\u05d5\u05d6\u05d5\u05ea \u05d4\u05e0\u05e9\u05d9\u05d0, \u05e8\u05d7\u05d5\u05d1\u05d5\u05ea, \u05de\u05d7\u05d5\u05d6 \u05d4\u05de\u05e8\u05db\u05d6, NO, \u05d9\u05e9\u05e8\u05d0\u05dc", "31.90784990", "34.81334092", "edu", "", "Israel", "2018"], ["Semantic Instance Annotation of Street Scenes by 3D to 2D Label Transfer", "", "University of Washington", "University of Washington", "University of Washington, Rainier Vista, Montlake, University District, Seattle, King County, Washington, 98195, USA", "47.65432380", "-122.30800894", "edu", "", "United States", "2016"], ["Active learning for structured probabilistic models with histogram approximation", "Virginia Tech, USA", "Virginia Tech", "Virginia Tech", "Blacksburg, VA 24061, USA", "37.22838430", "-80.42341670", "edu", "", "United States", "2015"], ["RefineNet: Multi-path Refinement Networks for High-Resolution Semantic Segmentation", "", "University of Adelaide", "University of Adelaide", "University of Adelaide, North Terrace, Adelaide, 5000, City of Adelaide, South Australia, 5000, Australia", "-34.91892260", "138.60423668", "edu", "", "Australia", "2017"], ["Beyond caption to narrative: Video captioning with multiple sentences", "", "University of Tokyo", "University of Tokyo", "\u6771\u4eac\u5927\u5b66 \u67cf\u30ad\u30e3\u30f3\u30d1\u30b9, \u5b66\u878d\u5408\u306e\u9053, \u67cf\u5e02, \u5343\u8449\u770c, \u95a2\u6771\u5730\u65b9, 277-8583, \u65e5\u672c", "35.90204480", "139.93622009", "edu", "", "Japan", "2016"], ["Learning to Segment Every Thing", "", "University of California, Berkeley", "University of California, Berkeley", "Berkeley Art Museum and Pacific Film Archive, Bancroft Way, Southside, Berkeley, Alameda County, California, 94720-1076, USA", "37.86871260", "-122.25586815", "edu", "", "United States", "2018"], ["Fast Patch-based Style Transfer of Arbitrary Style.", "", "University of British Columbia", "University of British Columbia", "University of British Columbia, Eagles Drive, Hawthorn Place, University Endowment Lands, Metro Vancouver, British Columbia, V6T, Canada", "49.25839375", "-123.24658161", "edu", "", "Canada", "2016"], ["Encoder-Decoder with Atrous Separable Convolution for Semantic Image Segmentation", "", "Google", "Google, Inc.", "1600 Amphitheatre Pkwy, Mountain View, CA 94043, USA", "37.42199990", "-122.08405750", "company", "Google, Mountain View, CA", "United States", "2018"], ["Mining Object Parts from CNNs via Active Question-Answering", "", "University of California, Los Angeles", "University of California, Los Angeles", "200 UCLA, Medical Plaza Driveway Suite 540, Los Angeles, CA 90095, USA", "34.06877880", "-118.44500940", "edu", "", "United States", "2017"], ["A review of object detection based on convolutional neural network", "Fundamental Science on Communication Information Transmission and Fusion Technology Laboratory, Hangzhou 310018, China", "Fundamental Science on Communication Information Transmission and Fusion Technology Laboratory, Hangzhou 310018, China", "Fundamental Science on Communication Information Transmission and Fusion Technology Laboratory, Hangzhou 310018, China", "Jianggan, Hangzhou, Zhejiang, China, 310018", "30.31600970", "120.37394070", "edu", "", "China", "2017"], ["Online Real-Time Multiple Spatiotemporal Action Localisation and Prediction", "", "Oxford University", "Oxford University", "University College, Logic Lane, Grandpont, Oxford, Oxon, South East, England, OX1 4EX, UK", "51.75208490", "-1.25166460", "edu", "", "United Kingdom", "2017"], ["Procedural Generation of Videos to Train Deep Action Recognition Networks", "", "Toyota Research Institute", "Toyota Research Institute", "Toyota Research Institute, 4440, West El Camino Real, Los Altos, Santa Clara County, California, 94022, USA", "37.40253645", "-122.11655107", "edu", "", "United States", "2017"], ["High-Value Target Detection", "", "University of Tartu", "UNIVERSITY OF TARTU", "Paabel, University of Tartu, 17, \u00dclikooli, Kesklinn, Tartu linn, Tartu, Tartu linn, Tartu maakond, 53007, Eesti", "58.38131405", "26.72078081", "edu", "", "Estonia", "2018"], ["Looking Beyond a Clever Narrative: Visual Context and Attention are Primary Drivers of Affect in Video Advertisements", "", "University of Illinois, Urbana-Champaign", "University of Illinois, Urbana-Champaign", "B-3, South Mathews Avenue, Urbana, Champaign County, Illinois, 61801, USA", "40.11116745", "-88.22587665", "edu", "", "United States", "2018"], ["Counting Everyday Objects in Everyday Scenes", "", "Georgia Institute of Technology", "Georgia Institute of Technology", "Georgia Tech, Atlantic Drive Northwest, Bellwood, Rockdale, Atlanta, Fulton County, Georgia, 30318, USA", "33.77603300", "-84.39884086", "edu", "", "United States", "2017"], ["Bottle Detection in the Wild Using Low-Altitude Unmanned Aerial Vehicles", "Wuhan University, School of Electronic Information, Wuhan, 430072, China", "Wuhan University of Technology", "Wuhan University of Technology", "\u6b66\u6c49\u7406\u5de5\u5927\u5b66-\u4f59\u5bb6\u5934\u6821\u533a, \u4ea4\u901a\u4e8c\u8def, \u6768\u56ed\u8857\u9053, \u6b66\u660c\u533a (Wuchang), \u6b66\u6c49\u5e02, \u6e56\u5317\u7701, 430062, \u4e2d\u56fd", "30.60903415", "114.35142840", "edu", "", "China", "2018"], ["Deep Learning Based Surveillance System for Open Critical Areas", "", "University of Florence", "University of Florence", "Piazza di San Marco, 4, 50121 Firenze FI, Italy", "43.77764260", "11.25976500", "edu", "", "Italy", "2018"], ["An efficient license plate recognition system using convolution neural networks", "Department of Electrical Engineering, National Taiwan Normal University, Taipei 106, Taiwan", "National Taiwan Normal University", "National Taiwan Normal University", "\u5e2b\u5927\u5206\u90e8, 88, \u6c40\u5dde\u8def\u56db\u6bb5, \u842c\u5e74\u91cc, \u6587\u5c71\u5340, \u81fa\u5317\u5e02, 11677, \u81fa\u7063", "25.00823205", "121.53577153", "edu", "", "Taiwan", "2018"], ["Online Adaptation of Convolutional Neural Networks for Video Object Segmentation", "", "RWTH Aachen University", "RWTH Aachen University", "RWTH Aachen, Mies-van-der-Rohe-Stra\u00dfe, K\u00f6nigsh\u00fcgel, Aachen-Mitte, Aachen, St\u00e4dteregion Aachen, Regierungsbezirk K\u00f6ln, Nordrhein-Westfalen, 52074, Deutschland", "50.77917030", "6.06728733", "edu", "", "Germany", "2017"], ["Improving Generalization via Scalable Neighborhood Component Analysis", "", "Microsoft Research Asia", "Microsoft Research Asia", "1 Memorial Dr, Cambridge, MA 02142, USA", "42.36142560", "-71.08120920", "company", "", "United States", "2018"], ["Attacking Visual Language Grounding with Adversarial Examples: A Case Study on Neural Image Captioning", "", "IBM Research, North Carolina", "IBM Research", "IBM, East Cornwallis Road, Research Triangle Park, Nelson, Durham County, North Carolina, 27709, USA", "35.90422720", "-78.85565763", "company", "", "United States", "2018"], ["Incremental Segmentation on Private Data without Catastrophic Forgetting", "", "Peking University", "Peking University", "\u5317\u4eac\u5927\u5b66, 5\u53f7, \u9890\u548c\u56ed\u8def, \u7a3b\u9999\u56ed\u5357\u793e\u533a, \u6d77\u6dc0\u533a, \u5317\u4eac\u5e02, 100871, \u4e2d\u56fd", "39.99223790", "116.30393816", "edu", "", "China", "2018"], ["Intelligent Computing Methodologies", "Tongji University, Shanghai, China", "Tongji University", "Tongji University", "\u540c\u6d4e\u5927\u5b66, 1239, \u56db\u5e73\u8def, \u6c5f\u6e7e, \u8679\u53e3\u533a, \u4e0a\u6d77\u5e02, 200092, \u4e2d\u56fd", "31.28473925", "121.49694909", "edu", "", "China", "2018"], ["An Intriguing Influence of Visual Data in Learning a Representation", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["Multiview Supervision By Registration", "", "University of Minnesota", "University of Minnesota", "WeismanArt, 333, East River Parkway, Marcy-Holmes, Phillips, Minneapolis, Hennepin County, Minnesota, 55455, USA", "44.97308605", "-93.23708813", "edu", "", "United States", "2018"], ["On the Iterative Refinement of Densely Connected Representation Levels for Semantic Segmentation", "", "Computer Vision Center, Barcelona", "Computer Vision Center, Barcelona", "Campus UAB, Edifici O, s/n, 08193 Cerdanyola del Vall\u00e8s, Barcelona, Spain", "41.50089570", "2.11155300", "edu", "", "Spain", "2018"], ["Multi-evidence Filtering and Fusion for Multi-label Classification, Object Detection and Semantic Segmentation Based on Weakly Supervised Learning", "", "University of Hong Kong", "University of Hong Kong", "\u6d77\u6d0b\u79d1\u5b78\u7814\u7a76\u6240 The Swire Institute of Marine Science, \u9db4\u5480\u9053 Cape D'Aguilar Road, \u9db4\u5480\u4f4e\u96fb\u53f0 Cape D'Aguilar Low-Level Radio Station, \u77f3\u6fb3 Shek O, \u82bd\u83dc\u5751\u6751 Nga Choy Hang Tsuen, \u5357\u5340 Southern District, \u9999\u6e2f\u5cf6 Hong Kong Island, HK, \u4e2d\u56fd", "22.20814690", "114.25964115", "edu", "", "China", "2018"], ["DeepDiary: Automatic Caption Generation for Lifelogging Image Streams.", "", "Indiana University", "Indiana University", "Indiana University East, West Cart Road, Richmond, Wayne County, Indiana, 47374, USA", "39.86948105", "-84.87956905", "edu", "", "United States", "2016"], ["Inferring Semantic Layout for Hierarchical Text-to-Image Synthesis", "", "University of Michigan", "University of Michigan", "University of Michigan, 500, Hayward Street, Ann Arbor, Washtenaw County, Michigan, 48109, USA", "42.29421420", "-83.71003894", "edu", "", "United States", "2018"], ["Progressive Visual Object Detection with Positive Training Examples Only", "Department of Signal Processing, Tampere University of Technology, Tampere, Finland", "Tampere University of Technology", "Tampere University of Technology", "TTY, 10, Korkeakoulunkatu, Finninm\u00e4ki, Hervanta, Tampere, Tampereen seutukunta, Pirkanmaa, L\u00e4nsi- ja Sis\u00e4-Suomen aluehallintovirasto, L\u00e4nsi-Suomi, Manner-Suomi, 33720, Suomi", "61.44964205", "23.85877462", "edu", "", "Finland", "2015"], ["Text-to-Image Generation Using Multi-Instance StackGan", "", "Stanford University", "Stanford University", "Stanford University, Memorial Way, Stanford, Santa Clara County, California, 94305-6015, USA", "37.43131385", "-122.16936535", "edu", "", "United States", ""], ["Bundled Object Context for Referring Expressions", "Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS), Institute of Computing Technology, CAS, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "China", "2018"], ["Quantifying the visual concreteness of words and topics in multimodal datasets", "", "Cornell University", "Cornell University", "Cornell University, Forest Home Drive, Forest Home, Tompkins County, New York, 14853, USA", "42.45055070", "-76.47835130", "edu", "", "United States", "2018"], ["A task in a suit and a tie: paraphrase generation with semantic augmentation", "", "University of Texas at Austin", "University of Texas at Austin", "University of Texas at Austin, 1, East 23rd Street, The Drag, Austin, Travis County, Texas, 78712, USA", "30.28415100", "-97.73195598", "edu", "", "United States", "2018"], ["Show, Adapt and Tell: Adversarial Training of Cross-Domain Image Captioner", "", "Microsoft Research Asia", "Microsoft Research Asia", "1 Memorial Dr, Cambridge, MA 02142, USA", "42.36142560", "-71.08120920", "company", "", "United States", "2017"], ["Learning Visual Classifiers using Human-centric Annotations", "", "Microsoft", "Microsoft Corporation, Redmond, WA, USA", "One Microsoft Way, Redmond, WA 98052, USA", "47.64233180", "-122.13693020", "company", "", "United States", "2015"], ["FoveaNet: Perspective-Aware Urban Scene Parsing", "", "Tsinghua University", "Tsinghua University", "\u6e05\u534e\u5927\u5b66, 30, \u53cc\u6e05\u8def, \u4e94\u9053\u53e3, \u540e\u516b\u5bb6, \u6d77\u6dc0\u533a, 100084, \u4e2d\u56fd", "40.00229045", "116.32098908", "edu", "", "China", "2017"], ["Exploiting Saliency for Object Segmentation from Image Level Labels", "", "University of Amsterdam", "University of Amsterdam", "Institute for Logic, Language and Computation (ILLC), 107, Science Park, Oost-Watergraafsmeer, Amsterdam, Oost, Amsterdam, Noord-Holland, Nederland, 1098XG, Nederland", "52.35536550", "4.95016440", "edu", "", "Netherlands", "2017"], ["A Structured Model For Action Detection", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2018"], ["RepMet: Representative-based metric learning for classification and one-shot object detection", "", "Technion", "Technion", "Haifa, 3200003, Israel", "32.77677830", "35.02312710", "edu", "", "Israel", "2018"], ["What is the Role of Recurrent Neural Networks (RNNs) in an Image Caption Generator?", "", "University of Malta", "University of Malta", "University of Malta, Ring Road, Japanese Garden, L-Imsida, Malta, MSD 9027, Malta", "35.90232260", "14.48341890", "edu", "", "Malta", "2017"], ["Batch-normalized recurrent highway networks", "", "Rochester Institute of Technology", "Rochester Institute of Technology", "Rochester Institute of Technology (RIT), 1, Lomb Memorial Drive, Bailey, Henrietta Town, Monroe County, New York, 14623, USA", "43.08250655", "-77.67121663", "edu", "", "United States", "2017"], ["Weakly Supervised Semantic Segmentation Using Web-Crawled Videos", "", "DGIST", "DGIST", "South Korea, Daegu, Dalseong-gun, Yuga-myeon, \ud14c\ud06c\ub178\uc911\uc559\ub300\ub85c 333", "35.70528600", "128.45710200", "edu", "", "South Korea", "2017"], ["Talking about other people: an endless range of possibilities", "", "University of Copenhagen", "University of Copenhagen", "K\u00f8benhavns Universitet, Krystalgade, K\u00f8dbyen, Vesterbro, K\u00f8benhavn, K\u00f8benhavns Kommune, Region Hovedstaden, 1165, Danmark", "55.68015020", "12.57232700", "edu", "", "Denmark", "2018"], ["What Actions are Needed for Understanding Human Actions in Videos?", "", "Carnegie Mellon University", "Carnegie Mellon University", "Carnegie Mellon University Silicon Valley, South Akron Road, ARC, Santa Clara County, California, 94035-0016, USA", "37.41021930", "-122.05965487", "edu", "", "United States", "2017"], ["Kobe University , NICT and University of Siegen at TRECVID 2017 AVS Task", "", "Kobe University", "Kobe University", "\u795e\u6238\u5927\u5b66, \u7058\u4e09\u7530\u7dda, \u7058\u533a, \u795e\u6238\u5e02, \u5175\u5eab\u770c, \u8fd1\u757f\u5730\u65b9, 657-00027, \u65e5\u672c", "34.72757140", "135.23710000", "edu", "", "Japan", "2018"], ["DeepSign: Deep Learning based Traffic Sign Recognition", "The State Key Laboratory of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China", "Chinese Academy of Sciences", "Chinese Academy of Sciences", "\u4e2d\u56fd\u79d1\u5b66\u9662\u5fc3\u7406\u7814\u7a76\u6240, 16, \u6797\u8403\u8def, \u671d\u9633\u533a / Chaoyang, \u5317\u4eac\u5e02, 100101, \u4e2d\u56fd", "40.00447950", "116.37023800", "edu", "", "China", "2018"]]}
\ No newline at end of file |
