site/datasets/unknown/voc.json


1

{"id": "0ee1916a0cb2dc7d3add086b5f1092c3d4beb38a", "citations": [{"id": "c399c0089fb134d1476fadf5f0426e0e8b70eebd", "title": "The Lov\u00e1sz Hinge: A Novel Convex Surrogate for Submodular Losses.", "year": "2018", "pdf": ["https://arxiv.org/pdf/1512.07797.pdf"], "doi": []}, {"id": "6b6fcf1220ea100aa80004018c78b137289d3c50", "title": "CAD: Scale Invariant Framework for Real-Time Object Detection", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8265304"]}, {"id": "656f05741c402ba43bb1b9a58bcc5f7ce2403d9a", "title": "Supervised Learning Approaches for Automatic Structuring of Videos. (M\u00e9thodes d'apprentissage supervis\u00e9 pour la structuration automatique de vid\u00e9os)", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/656f/05741c402ba43bb1b9a58bcc5f7ce2403d9a.pdf"], "doi": []}, {"id": "aa3398e15395a2a380c7c6b3f274c8c60fb0b48c", "title": "Chained Cascade Network for Object Detection", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8237476"]}, {"id": "e58434a01c45505995b000f5e631843a2f2ea582", "title": "Scale coding bag of deep features for human attribute and action recognition", "year": "2017", "pdf": ["https://arxiv.org/pdf/1612.04884.pdf"], "doi": []}, {"id": "eaf65c7cf4e9f7868c61f48656cb608fae0adcee", "title": "Visual dictionaries as intermediate features in the human brain", "year": "2014", "pdf": ["http://journal-cdn.frontiersin.org/article/104962/files/pubmed-zip/versions/1/pdf", "http://journal.frontiersin.org/article/10.3389/fncom.2014.00168/pdf", "https://pure.uva.nl/ws/files/2455021/162945_fncom_08_00168.pdf"], "doi": ["https://www.ncbi.nlm.nih.gov/pubmed/25642183", "http://doi.org/10.3389/fncom.2014.00168", "https://www.wikidata.org/entity/Q34969835"]}, {"id": "4c5d723dd83250c6b289c94318717de2d373a6ed", "title": "Learning Image Classification and Retrieval Models", "year": "2012", "pdf": [], "doi": []}, {"id": "841a5de1d71a0b51957d9be9d9bebed33fb5d9fa", "title": "PCANet: A Simple Deep Learning Baseline for Image Classification?", "year": "2015", "pdf": ["https://arxiv.org/pdf/1404.3606.pdf"], "doi": []}, {"id": "095ccb4e2e0f3934dc1aa51c685b2f54c8a6e588", "title": "Derivate-based Component-Trees for Multi-Channel Image Segmentation", "year": "2017", "pdf": ["https://arxiv.org/pdf/1705.01906.pdf"], "doi": []}, {"id": "a221588fd2d062462254481cfd9563fec2f7c387", "title": "Deep neural network ensemble architecture for eye movements classification", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8345537"]}, {"id": "67126ad0af544740c455311d08cb180aec830a6c", "title": "Generating Descriptions of Spatial Relations between Objects in Images", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/6712/6ad0af544740c455311d08cb180aec830a6c.pdf"], "doi": []}, {"id": "823db813f036365cf9b22b2081ec167a2b582532", "title": "Segmentation and Shape Extraction from Convolutional Neural Networks", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8354273", "http://doi.ieeecomputersociety.org/10.1109/WACV.2018.00169", "http://doi.org/10.1109/WACV.2018.00169", "http://www.grk1564.uni-siegen.de/publicationPDFbyID?ID=926"]}, {"id": "f3ccdf54a3384e601fa36969e7b3f657e2516a3b", "title": "Paying More A ention to Saliency : Image Captioning with Saliency and Context A ention 1 : 3", "year": "2017", "pdf": [], "doi": []}, {"id": "2c9c597ab660815e07980e9655c3c5989402205b", "title": "Vision-Based Reacquisition for Task-Level Control", "year": "2010", "pdf": ["https://pdfs.semanticscholar.org/2c9c/597ab660815e07980e9655c3c5989402205b.pdf"], "doi": []}, {"id": "aae1bf434983545c8a99a5dbfc2ce37435c76e03", "title": "SampleAhead: Online Classifier-Sampler Communication for Learning from Synthesized Data", "year": "2018", "pdf": ["https://arxiv.org/pdf/1804.00248.pdf"], "doi": []}, {"id": "ff18125a8f549135e6320fed91d0002bd2dae635", "title": "Colour Terms: a Categorisation Model Inspired by Visual Cortex Neurons", "year": "2017", "pdf": ["https://arxiv.org/pdf/1709.06300.pdf"], "doi": []}, {"id": "3e50e351687779c05390daf117f0394d1556cd3c", "title": "Die Detektion interessanter Objekte unter Verwendung eines objektbasierten Aufmerksamkeitsmodells", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/3e50/e351687779c05390daf117f0394d1556cd3c.pdf"], "doi": []}, {"id": "065f05c9cb2a6080191851dd82cd9b439a77499a", "title": "Comparing Boosted Cascades to Deep Learning Architectures for Fast and Robust Coconut Tree Detection in Aerial Images", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/065f/05c9cb2a6080191851dd82cd9b439a77499a.pdf"], "doi": []}, {"id": "4ba503d8f173880d8e8402808f54b78b653e5d20", "title": "Accelerating Stochastic Gradient Descent via Online Learning to Sample", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/4ba5/03d8f173880d8e8402808f54b78b653e5d20.pdf"], "doi": []}, {"id": "03a2235fea70317461222fac05e38ee35ead9711", "title": "Implementation of a Computer Vision Algorithm for Onboard Detection of Unmanned Aircraft submitted by Luk\u00e1\u0161 Bauer", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/03a2/235fea70317461222fac05e38ee35ead9711.pdf"], "doi": []}, {"id": "d07dabdea9e2e4546b09d07a019723ceb6c61b84", "title": "Deep learning for text spotting", "year": "2015", "pdf": [], "doi": []}, {"id": "7f66ff8dd0313fc9c7d67be7ea5aecdda956657c", "title": "Tracking-by-Segmentation with Online Gradient Boosting Decision Tree", "year": "2015", "pdf": ["http://openaccess.thecvf.com/content_iccv_2015/papers/Son_Tracking-by-Segmentation_With_Online_ICCV_2015_paper.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015/papers/Son_Tracking-by-Segmentation_With_Online_ICCV_2015_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410707", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2015.350", "http://doi.org/10.1109/ICCV.2015.350"]}, {"id": "4896c9f6958137c88db29a3a707aafae3c29d106", "title": "Discriminative Re-ranking of Diverse Segmentations", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619095"]}, {"id": "858555b6f4663fe083d6c81a2671c9cd8130bbf3", "title": "Object Discovery via Cohesion Measurement", "year": "2018", "pdf": ["https://arxiv.org/pdf/1704.08944.pdf"], "doi": []}, {"id": "f81f5da2a1e4eb80b465b8dffca4c9e583a8a8a6", "title": "Rapid Object Detection Systems , Utilising Deep Learning and Unmanned Aerial Systems ( Uas ) for Civil Engineering Applications", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/f81f/5da2a1e4eb80b465b8dffca4c9e583a8a8a6.pdf"], "doi": []}, {"id": "369bd35ab8bad4c7bc5e376cc776a5366d97b12e", "title": "An Object Detector Trained on Line Drawings", "year": "2012", "pdf": ["https://pdfs.semanticscholar.org/369b/d35ab8bad4c7bc5e376cc776a5366d97b12e.pdf"], "doi": []}, {"id": "46971fb6caa61c606b046da855be4e196a830ccf", "title": "Identification of Scene Text by Character Descriptor in Smart Mobile Devices", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/4697/1fb6caa61c606b046da855be4e196a830ccf.pdf"], "doi": []}, {"id": "afad16c9fee11d8f78785af6b1856beb86b5ccf4", "title": "Explain to Fix: A Framework to Interpret and Correct DNN Object Detector Predictions", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.08011.pdf"], "doi": []}, {"id": "9089280062cf40870a322d687c2850d45c02ebae", "title": "Single Image Action Recognition by Predicting Space-Time Saliency", "year": "2017", "pdf": ["https://arxiv.org/pdf/1705.04641.pdf"], "doi": []}, {"id": "cf384eda31030a45238ebd8356ace7600da5076b", "title": "Cross-Domain CNN for Hyperspectral Image Classification", "year": "2018", "pdf": ["https://arxiv.org/pdf/1802.00093.pdf"], "doi": []}, {"id": "44c5e66e58dd8212b753662e08cc0a7c8327ec50", "title": "Scene Parsing with Object Instance Inference Using Regions and Per-exemplar Detectors", "year": "2014", "pdf": ["http://slazebni.cs.illinois.edu/publications/jtighe-ijcv14.pdf", "http://wwwx.cs.unc.edu/~mn/sites/default/files/jtighe-ijcv14.pdf"], "doi": ["https://doi.org/10.1007/s11263-014-0778-5"]}, {"id": "83acbf0bee402b0472ff101cee5942f4137d91c3", "title": "Semi-automatic Annotation on Image Segmentation Hierarchies", "year": "2012", "pdf": ["https://pdfs.semanticscholar.org/83ac/bf0bee402b0472ff101cee5942f4137d91c3.pdf"], "doi": []}, {"id": "e9af96d478b487fec9a06dde9e43b2ed3355ea7b", "title": "Automatic thresholding of SIFT descriptors", "year": "2016", "pdf": ["https://arxiv.org/pdf/1811.03173.pdf"], "doi": []}, {"id": "b1369e4785dd0b23f89ca76f45468049c8667863", "title": "1 DARTS : Deceiving Autonomous Cars with Toxic Signs", "year": "2018", "pdf": [], "doi": []}, {"id": "1a5151b4205ab27b1c76f98964debbfc11b124d5", "title": "Self Paced Deep Learning for Weakly Supervised Object Detection", "year": "2018", "pdf": ["https://arxiv.org/pdf/1605.07651.pdf"], "doi": []}, {"id": "f1d8c377093ecf64afd7f17383738e81666fe5ae", "title": "Remote Detection of Idling Cars Using Infrared Imaging and Deep Networks", "year": "2018", "pdf": ["https://arxiv.org/pdf/1804.10805.pdf"], "doi": []}, {"id": "12ff1c48f5776fda9d156c7b324af3f2674420a9", "title": "Are Large Scale Training Images or Discriminative Features Important for Codebook Construction?", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/12ff/1c48f5776fda9d156c7b324af3f2674420a9.pdf"], "doi": []}, {"id": "e4dc24e4926df4de3e8d7ca7cd1f4115e91f03e1", "title": "Instance-level video segmentation from object tracks Anonymous CVPR submission", "year": "", "pdf": ["https://pdfs.semanticscholar.org/e4dc/24e4926df4de3e8d7ca7cd1f4115e91f03e1.pdf"], "doi": []}, {"id": "194af94f1ea9357bebb0aab5ab98aa0daa21ddbd", "title": "Snapshot Distillation: Teacher-Student Optimization in One Generation", "year": "2018", "pdf": ["https://arxiv.org/pdf/1812.00123.pdf"], "doi": []}, {"id": "9d67f5adf4497ba99201d318cfbbed07e926c05b", "title": "Unseen Object Segmentation in Videos via Transferable Representations", "year": "2019", "pdf": ["https://arxiv.org/pdf/1901.02444.pdf"], "doi": []}, {"id": "0caef87116f62fcc86735401a9aa9d4e170ffbef", "title": "On Performance Evaluation of Driver Hand Detection Algorithms: Challenges, Dataset, and Metrics", "year": "2015", "pdf": ["http://cvrr.ucsd.edu/eshed/papers/Das_ITSC2015.pdf", "http://cvrr.ucsd.edu/publications/2015/DasOhnbarTrivedi_ITSC2015.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7313566", "http://doi.org/10.1109/ITSC.2015.473"]}, {"id": "806aea24148fc2ef851803c216a0a25894d78bf4", "title": "Correlation filter based visual trackers for person pursuit using a low-cost Quadrotor", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7294481", "http://doi.org/10.1109/I4CS.2015.7294481"]}, {"id": "63ed42249d7cbb21a4b0d42419d42b014ff114eb", "title": "Comprehensive Parameter Sweep for Learning-Based Detector on Traffic Lights", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/4817/826f1af10e0c31dee067f8d9255d6387d486.pdf"], "doi": []}, {"id": "1b1323b4677c640ae8835a9ccab611ca1e9652e3", "title": "Robust object tracking with a hierarchical ensemble framework", "year": "2016", "pdf": ["https://arxiv.org/pdf/1509.06925.pdf"], "doi": []}, {"id": "557e5e38a4c5b95e2bc86f491b03e5c8c7add857", "title": "Thin-Slicing for Pose: Learning to Understand Pose without Explicit Pose Estimation", "year": "2016", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2016/papers/Kwak_Thin-Slicing_for_Pose_CVPR_2016_paper.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Kwak_Thin-Slicing_for_Pose_CVPR_2016_paper.pdf", "http://www.di.ens.fr/willow/pdfscurrent/kwak2016.pdf", "https://vlg.dgist.ac.kr/research/pose_emb/data/CVPR2016_pose.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780903", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.534", "http://doi.org/10.1109/CVPR.2016.534"]}, {"id": "6bcc2b50e32bdbb0c668f75000badf21e6cd0839", "title": "Knowledge Projection for Deep Neural Networks", "year": "2017", "pdf": ["https://arxiv.org/pdf/1710.09505.pdf"], "doi": []}, {"id": "071680ca97de050a372ea79f2b99f102bb3ca6ef", "title": "Inferring Unseen Views of People", "year": "2014", "pdf": ["http://vision.cs.utexas.edu/projects/infering_unseen_views_of_people/inferring-unseen-views-of-people-paper.pdf", "http://vision.cs.utexas.edu/projects/infering_unseen_views_of_people/inferring-unseen-views-of-people-poster.pdf", "http://vision.cs.utexas.edu/projects/infering_unseen_views_of_people/supp.pdf", "http://www.cs.utexas.edu/~chaoyeh/cvpr_2014_Inferring_Unseen_Views_of_People%20(2).pdf", "http://www.cs.utexas.edu/~grauman/papers/chen-pose-cvpr2014.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2014/papers/Chen_Inferring_Unseen_Views_2014_CVPR_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909655", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2014.258", "http://doi.org/10.1109/CVPR.2014.258"]}, {"id": "415c0eecce9fde7d1ba9c70bd0bfa5471760c117", "title": "Oriented Object Proposals", "year": "2015", "pdf": ["http://openaccess.thecvf.com/content_iccv_2015/papers/He_Oriented_Object_Proposals_ICCV_2015_paper.pdf", "http://www.cs.cityu.edu.hk/~rynson/papers/iccv15.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015/papers/He_Oriented_Object_Proposals_ICCV_2015_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410397", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2015.40", "http://doi.org/10.1109/ICCV.2015.40"]}, {"id": "f865248065b8d6bcbce4a4053b73e4de2080ba23", "title": "Efficient object detection for high resolution images", "year": "2015", "pdf": ["https://arxiv.org/pdf/1510.01257.pdf"], "doi": []}, {"id": "e0e19769ad446c2a74c0616fcfb551059c899ce6", "title": "Part level transfer regularization for enhancing exemplar SVMs", "year": "2015", "pdf": ["http://people.csail.mit.edu/yusuf/publications/2015/Aytar15/aytar15.pdf"], "doi": ["http://doi.org/10.1016/j.cviu.2015.04.004"]}, {"id": "009fba8df6bbca155d9e070a9bd8d0959bc693c2", "title": "Rich Feature Hierarchies for Accurate Object Detection and Semantic Segmentation", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909475"]}, {"id": "a0703bef11c978cc8faf05eb229e29a889f8a0b1", "title": "Superpixel Hierarchy", "year": "2018", "pdf": ["https://arxiv.org/pdf/1605.06325.pdf"], "doi": []}, {"id": "472de7b3c674e8f06702385569779d11b71bc8f2", "title": "Superpixel Coherency and Uncertainty Models for Semantic Segmentation", "year": "2013", "pdf": ["http://cvlab.postech.ac.kr/~tgx.lim/paper/iccv2013_semantic.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_workshops_2013/W08/papers/Baek_Superpixel_Coherency_and_2013_ICCV_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6755909"]}, {"id": "73818ae13a89c2377c30cdb029fdb7e490fe5367", "title": "Joint cost minimization for multi-object tracking", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8078481", "http://doi.ieeecomputersociety.org/10.1109/AVSS.2017.8078481", "http://doi.org/10.1109/AVSS.2017.8078481"]}, {"id": "ba51ce1ec7b18fa808985b919f4a201fe5e4bafb", "title": "Semantic parsing for priming object detection in indoors RGB-D scenes", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/ba51/ce1ec7b18fa808985b919f4a201fe5e4bafb.pdf"], "doi": []}, {"id": "23e707600c3e9a240e24eaa4ed4b0e4ec6a436c1", "title": "Automatic foreground extraction via joint CRF and online learning", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/7f3b/115dd38a933f3a88e3b20b58862216297d63.pdf"], "doi": []}, {"id": "c5632e2117d268159225d5c307b7efbb6428ccba", "title": "Understanding image concepts using ISTOP model", "year": "2016", "pdf": ["http://www.cs.uu.nl/groups/MG/multimedia/publications/art/PR2016b.pdf"], "doi": ["http://doi.org/10.1016/j.patcog.2015.11.010"]}, {"id": "773fd71d3d24c268c99e1c53ae87a28da3bbe0f6", "title": "Conditional Entropies as Over-Segmentation and Under-Segmentation Metrics for Multi-Part Image Segmentation", "year": "2011", "pdf": [], "doi": []}, {"id": "0435a34e93b8dda459de49b499dd71dbb478dc18", "title": "VEGAC: Visual Saliency-based Age, Gender, and Facial Expression Classification Using Convolutional Neural Networks", "year": "2018", "pdf": [], "doi": []}, {"id": "02567fd428a675ca91a0c6786f47f3e35881bcbd", "title": "Deep Label Distribution Learning With Label Ambiguity", "year": "2017", "pdf": ["https://arxiv.org/pdf/1611.01731.pdf"], "doi": []}, {"id": "9ea7205ef136f207123cd6b54e15075835ae0049", "title": "Self-supervised language grounding by active sensing combined with Internet acquired images and text", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/9ea7/205ef136f207123cd6b54e15075835ae0049.pdf"], "doi": []}, {"id": "6452d294af27b1f9408c9522bfb98bf00e1e4732", "title": "A novel infrared video surveillance system using deep learning based techniques", "year": "2018", "pdf": ["https://ore.exeter.ac.uk/repository/bitstream/handle/10871/32083/MTA-manuscript-revision-R2-accepted.pdf?isAllowed=y&sequence=1", "https://repository.edgehill.ac.uk/10281/6/MTA-manuscript-revision-R2.pdf"], "doi": ["https://doi.org/10.1007/s11042-018-5883-y"]}, {"id": "191beb87f84326d2cc9c427efe2a5abee8f67574", "title": "Dual Local-Global Contextual Pathways for Recognition in Aerial Imagery", "year": "2016", "pdf": ["https://arxiv.org/pdf/1605.05462.pdf"], "doi": []}, {"id": "5020a75c45416073d0b07b1deb7382bc80de1779", "title": "Human Detection Using Learned Part Alphabet and Pose Dictionary", "year": "2014", "pdf": ["http://cis-linux1.temple.edu/~latecki/Papers/HumanDetectionECCV2014.pdf", "http://mc.eistar.net/UpLoadFiles/Papers/%5B38%5D%202014%20ECCV%20Yaocong.pdf", "http://vigir.missouri.edu/~gdesouza/Research/Conference_CDs/ECCV_2014/papers/8693/86930251.pdf", "https://cis.temple.edu/~latecki/Papers/HumanDetectionECCV2014.pdf"], "doi": ["http://doi.org/10.1007/978-3-319-10602-1_17"]}, {"id": "6e7248f33be3f6b44d6089b7039a5c2d84acaed0", "title": "Object cosegmentation using deep Siamese network", "year": "2018", "pdf": ["https://arxiv.org/pdf/1803.02555.pdf"], "doi": []}, {"id": "b8ccc5341a1b0214e9d155b019962023f344c2ee", "title": "Incremental Learning of Object Detectors without Catastrophic Forgetting", "year": "2017", "pdf": ["https://arxiv.org/pdf/1708.06977.pdf"], "doi": []}, {"id": "37668092cf8b7695d4a85eb7a25e9a2ef0fd0739", "title": "Robust object detection under partial occlusion", "year": "2016", "pdf": [], "doi": []}, {"id": "49f276e1b8fd162ac3cd996becc63cab2b2535b7", "title": "Trained 3D Models for CNN based Object Recognition", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/49f2/76e1b8fd162ac3cd996becc63cab2b2535b7.pdf"], "doi": []}, {"id": "1426045c4188f09fec46d0d2f246357a230a1748", "title": "Structured Labels in Random Forests for Semantic Labelling and Object Detection", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6784137", "http://doi.org/10.1109/TPAMI.2014.2315814", "https://www.ncbi.nlm.nih.gov/pubmed/26352638", "https://www.wikidata.org/entity/Q38404154"]}, {"id": "efe133717899b41cd4c0b0c999da312d3af60a6e", "title": "Depth-Based Hand Pose Estimation: Methods, Data, and Challenges", "year": "2018", "pdf": ["https://arxiv.org/pdf/1504.06378.pdf"], "doi": []}, {"id": "9caa7605c16da42761c8a27327f5f037dbf901fa", "title": "q-Gaussian mixture models for image and video semantic indexing", "year": "2013", "pdf": [], "doi": ["http://doi.org/10.1016/j.jvcir.2013.10.005", "http://t2r2.star.titech.ac.jp/rrws/file/CTT100664441/ATD100000413/"]}, {"id": "4bb84c9b24456fb0bb920ca83280bd9c48ad4b66", "title": "Instance-Level Video Segmentation from Object Tracks", "year": "2016", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2016/papers/Seguin_Instance-Level_Video_Segmentation_CVPR_2016_paper.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Seguin_Instance-Level_Video_Segmentation_CVPR_2016_paper.pdf", "http://www.di.ens.fr/willow/pdfscurrent/seguin2016.pdf", "http://www.di.ens.fr/willow/research/instancelevel/seguin16instancelevel.pdf", "http://www.di.ens.fr/~bojanowski/papers/seguin16instance.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780769", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.400", "http://doi.org/10.1109/CVPR.2016.400"]}, {"id": "ce0dbe6b1abecb54dcc98dbe652aa63d190dbc94", "title": "Part-Based Models for Finding People and Estimating Their Pose", "year": "2011", "pdf": ["https://pdfs.semanticscholar.org/ce0d/be6b1abecb54dcc98dbe652aa63d190dbc94.pdf"], "doi": []}, {"id": "a5683661e80668e05170bf17bcbd754d1b07af74", "title": "Comparison of Data Set Bias in Object Recognition Benchmarks", "year": "2015", "pdf": ["http://vfacstaff.ltu.edu/lshamir/publications/object_recognition_dataset_bias.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7299607", "http://doi.org/10.1109/ACCESS.2015.2491921"]}, {"id": "646a669f1dc38ae961fe41fbd3c83cab64ce9d53", "title": "Real-Time Seamless Single Shot 6D Object Pose Prediction", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578136"]}, {"id": "575a0e97702edcb0621a47b574949bac50e34200", "title": "Unsupervised Learning by Predicting Noise", "year": "2017", "pdf": ["https://arxiv.org/pdf/1704.05310.pdf"], "doi": []}, {"id": "b9128ff3b0b96815ff41a7d5fb2b4bef69f635ca", "title": "Deconvolutional Feature Stacking for Weakly-Supervised Semantic Segmentation", "year": "2016", "pdf": ["https://arxiv.org/pdf/1602.04984.pdf"], "doi": []}, {"id": "7c03a0ad5202a6a31ad3b78b11f6b45ecd840616", "title": "Scale-Invariant Feature Learning using Deconvolutional Neural Networks for Weakly-Supervised Semantic Segmentation", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/7c03/a0ad5202a6a31ad3b78b11f6b45ecd840616.pdf"], "doi": []}, {"id": "17342b1c4caccfc499d9ae55a68d7b93285c5d6b", "title": "Action recognition in still images using a combination of human pose and context information", "year": "2012", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6466977", "http://doi.org/10.1109/ICIP.2012.6466977"]}, {"id": "571d2b173c2db8ac751dabdfcf5a18c06f365e05", "title": "Improved Part Segmentation Performance by Optimising Realism of Synthetic Images using Cycle Generative Adversarial Networks", "year": "2018", "pdf": ["https://arxiv.org/pdf/1803.06301.pdf"], "doi": []}, {"id": "90e36f66c25a4c73a252102c6c6c329c36d82676", "title": "Probably Unknown: Deep Inverse Sensor Modelling In Radar", "year": "2018", "pdf": ["https://arxiv.org/pdf/1810.08151.pdf"], "doi": []}, {"id": "fb710e9d897b7c1fd5275a0bcfa22711c5768990", "title": "A Graphical Model for Rapid Obstacle Image-Map Estimation from Unmanned Surface Vehicles", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/fb71/0e9d897b7c1fd5275a0bcfa22711c5768990.pdf"], "doi": []}, {"id": "821ba3eba1e36a29cc482f5378f4a0d0f6893159", "title": "Unsupervised Domain Adaptation for Learning Eye Gaze from a Million Synthetic Images: An Adversarial Approach", "year": "2018", "pdf": ["https://arxiv.org/pdf/1810.07926.pdf"], "doi": []}, {"id": "b50156e76ae03a1c0b04cd2076a99b7f2b441506", "title": "An image classification method that considers privacy-preservation", "year": "2016", "pdf": [], "doi": ["http://doi.org/10.1016/j.neucom.2016.04.056"]}, {"id": "3481a544e28cfc14108b0785eef7c12747e622ee", "title": "Online Multi-object Tracking via Structural Constraint Event Aggregation", "year": "2016", "pdf": ["http://faculty.ucmerced.edu/mhyang/papers/cvpr16_mot.pdf", "http://vc.cs.nthu.edu.tw/home/paper/codfiles/melu/201703210652/Online%20Multi-Object%20Tracking%20via%20Structural%20Constraint%20Event%20Aggregation.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Yoon_Online_Multi-Object_Tracking_CVPR_2016_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780524", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.155", "http://doi.org/10.1109/CVPR.2016.155"]}, {"id": "7fd5d2b0a034da43a747f6b8be3e51d775a05625", "title": "A Method to Detect Boats in Images of the Amazonian Rivers", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8247064", "http://doi.ieeecomputersociety.org/10.1109/BRACIS.2017.73", "http://doi.org/10.1109/BRACIS.2017.73"]}, {"id": "13105c611a059b4825bc92ff9778f532b6a849b2", "title": "Compressing Sparse Feature Vectors Using Random Ortho-Projections", "year": "2010", "pdf": ["http://www.ee.oulu.fi/mvg/files/pdf/PID1267977.pdf", "http://www.ee.oulu.fi/research/mvmp/mvg/files/pdf/PID1267977.pdf", "http://www.rni.helsinki.fi/~msa/pub/ICPR2010.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=5597593", "http://doi.ieeecomputersociety.org/10.1109/ICPR.2010.345", "http://doi.org/10.1109/ICPR.2010.345"]}, {"id": "0967341790643f680f3fc9dc87bfe311723be4e4", "title": "A Perception-Driven Transcale Display Scheme for Space Image Sequences", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/0967/341790643f680f3fc9dc87bfe311723be4e4.pdf"], "doi": []}, {"id": "a8bf49021017e19df051a3efb7337d93ea263e37", "title": "Deep Multiple Instance Hashing for Object-based Image Retrieval", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/a8bf/49021017e19df051a3efb7337d93ea263e37.pdf"], "doi": []}, {"id": "347ce37f15cea5bb8d0a676562664f80e3609b78", "title": "Pixel Objectness: Learning to Segment Generic Objects Automatically in Images and Videos", "year": "2018", "pdf": ["https://arxiv.org/pdf/1808.04702.pdf"], "doi": []}, {"id": "0755ee472e2bc2968b16f851a16c39b3f3e2d0d0", "title": "From Weakly Supervised Object Localization to Semantic Segmentation by Probabilistic Image Modeling", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8227436", "http://doi.org/10.1109/DICTA.2017.8227436"]}, {"id": "659fc2a483a97dafb8fb110d08369652bbb759f9", "title": "Improving the Fisher Kernel for Large-Scale Image Classification", "year": "2010", "pdf": ["https://pdfs.semanticscholar.org/659f/c2a483a97dafb8fb110d08369652bbb759f9.pdf"], "doi": []}, {"id": "1e02dfeb93e8fd8753d2e69baf705baf8996cb81", "title": "Online Object Tracking, Learning and Parsing with And-Or Graphs", "year": "2014", "pdf": ["https://arxiv.org/pdf/1509.08067.pdf"], "doi": []}, {"id": "bdfb5f11d497b44b17d0315c3b6892f835723832", "title": "Object Captioning and Retrieval with Natural Language", "year": "2018", "pdf": ["https://arxiv.org/pdf/1803.06152.pdf"], "doi": []}, {"id": "43fe9006b90137d6ce85a539685ce66c13f0e38e", "title": "A review of image-based automatic facial landmark identification techniques", "year": "", "pdf": ["https://pdfs.semanticscholar.org/43fe/9006b90137d6ce85a539685ce66c13f0e38e.pdf"], "doi": []}, {"id": "642772c38ff690d17a3ce84a1d8646aefc802139", "title": "VIDEO OBJECT TRACKING BASED ON AUTOMATIC BACKGROUND SEGMENTATION : A SURVEY", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/6427/72c38ff690d17a3ce84a1d8646aefc802139.pdf"], "doi": []}, {"id": "303c08071500421c3aca758e6c7cd6a9fcbda1a8", "title": "Scene understanding with complete scenes and structured representations", "year": "2014", "pdf": [], "doi": []}, {"id": "86f0f71bff42e4bdc60014e4f94ec76d52c8eccf", "title": "Felzenszwalb-Baum-Welch: Event Detection by Changing Appearance", "year": "2013", "pdf": ["https://arxiv.org/pdf/1306.4746.pdf"], "doi": []}, {"id": "d9cc8bc5c4a4b29ab40f75b721bd9e5140d2baf6", "title": "Object Detection for Crime Scene Evidence Analysis Using Deep Learning", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/6926/4f28158f9245a06f7a2c1ae666241261cc0e.pdf"], "doi": []}, {"id": "d3f6b3ce8f7b67c1e112a79b3fe9764242c655f5", "title": "Recovering from Random Pruning: On the Plasticity of Deep Convolutional Neural Networks", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8354202"]}, {"id": "9b6538d09e914c41345812b3086feff1dc1ae218", "title": "Detecting Comma-shaped Clouds for Severe Weather Forecasting using Shape and Motion", "year": "2018", "pdf": ["https://arxiv.org/pdf/1802.08937.pdf"], "doi": []}, {"id": "bf417e1c265b31720b4fb980afb83cc3a573fa6f", "title": "Representations and Similarities of Images for Visual Classification", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/bf41/7e1c265b31720b4fb980afb83cc3a573fa6f.pdf"], "doi": []}, {"id": "4dc57432fa8fea1614a39c324bf11ae0620cb26f", "title": "Aalborg Universitet Detection of U . S . Traffic", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/6e53/63af2bfb7d1b2bd13feb41c2688bd0cf12b3.pdf"], "doi": []}, {"id": "878169be6e2c87df2d8a1266e9e37de63b524ae7", "title": "Image interpretation above and below the object level.", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/8781/69be6e2c87df2d8a1266e9e37de63b524ae7.pdf"], "doi": []}, {"id": "3daafe6389d877fe15d8823cdf5ac15fd919676f", "title": "Human Action Localization with Sparse Spatial Supervision", "year": "2016", "pdf": ["https://arxiv.org/pdf/1605.05197.pdf"], "doi": []}, {"id": "04f9b591cdfa1e3667230ae1224b1dfdac0a8ef1", "title": "Discriminative Segment Annotation in Weakly Labeled Video", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619165"]}, {"id": "4e4f2c4d2ea47636ca2ab795770d6b3214640f37", "title": "Efficient Maximum Appearance Search for Large-Scale Object Detection", "year": "2013", "pdf": ["http://researcher.watson.ibm.com/researcher/files/us-liangliang.cao/qiangcvpr2013_final.pdf", "http://rogerioferis.com/publications/ChenCVPR2013.pdf", "http://vigir.missouri.edu/~gdesouza/Research/Conference_CDs/IEEE_CVPR2013/data/Papers/4989d190.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2013/papers/Chen_Efficient_Maximum_Appearance_2013_CVPR_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619254", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2013.410", "http://doi.org/10.1109/CVPR.2013.410"]}, {"id": "9434524669777d281a8a7358f20181c9e157942e", "title": "VSEM: An open library for visual semantics representation", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/9434/524669777d281a8a7358f20181c9e157942e.pdf"], "doi": []}, {"id": "0e0900b88c33b671be5dd2ded9885b6526d6b429", "title": "From captions to visual concepts and back", "year": "2015", "pdf": ["https://arxiv.org/pdf/1411.4952.pdf"], "doi": []}, {"id": "4d910c5ab0b70ddbef6be944077ed63821608135", "title": "On Dimensionality Reduction for Indexing and Retrieval of Large-Scale Solar Image Data", "year": "2012", "pdf": ["https://pdfs.semanticscholar.org/4d91/0c5ab0b70ddbef6be944077ed63821608135.pdf"], "doi": []}, {"id": "9076183dcdb28ebb3e547f7ffd3f9d5d0faec531", "title": "Describing Video Contents in Natural Language", "year": "2012", "pdf": [], "doi": []}, {"id": "07764e1607d9e3d8094455adb658077996eb38c4", "title": "End-to-End Trained CNN Encoder-Decoder Networks for Image Steganography", "year": "2018", "pdf": ["https://arxiv.org/pdf/1711.07201.pdf"], "doi": []}, {"id": "46f135110c5fc5f158bc3ffce21b9ae946c7ff68", "title": "Adaptive NormalHedge for robust visual tracking", "year": "2015", "pdf": ["https://core.ac.uk/download/pdf/33581176.pdf", "https://pure.qub.ac.uk/portal/files/13941301/main_huiyu.pdf"], "doi": ["https://doi.org/10.1016/j.sigpro.2014.08.027"]}, {"id": "b961009dedea99f948650df7291a28f18bbfc1dc", "title": "Towards Automated Visual Monitoring of Individual Gorillas in the Wild", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8265544"]}, {"id": "7dbc61e2dc497e9dcff98e7df832780cc8a2b60c", "title": "A Flexible Object-of-Interest Annotation Framework for Online Video Portals", "year": "2012", "pdf": ["http://www.mdpi.com/1999-5903/4/1/179/pdf"], "doi": ["https://doi.org/10.3390/fi4010179"]}, {"id": "d4f454b24a7901dea14858808bbe277c7bee8ffb", "title": "Edge-based Component-Trees for Multi-Channel Image Segmentation", "year": "2017", "pdf": [], "doi": []}, {"id": "6768b558cc58e113096540c123ef3b2c2d2469a1", "title": "Maximum Margin Linear Classifiers in Unions of Subspaces", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/1a06/e518bf15015153b4973bb2e9e06e51485a4c.pdf"], "doi": []}, {"id": "ba6c19771926564e89be4ace7c33dc3da580249e", "title": "Utilisation du contexte pour l'indexation s\u00e9mantique des images et vid\u00e9os. (Using context for semantic indexing of images and videos)", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/ba6c/19771926564e89be4ace7c33dc3da580249e.pdf"], "doi": []}, {"id": "447b28c347172c6da0fb4d764a534fdee557b7f8", "title": "Studying Relationships between Human Gaze, Description, and Computer Vision", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6618945"]}, {"id": "782b21e803d149955c627c063ae60efeae04a9b1", "title": "Analysis of Multilayer Neural Networks for Object Recognition", "year": "2014", "pdf": [], "doi": []}, {"id": "3e01f2fefe219bfeb112f1d82e76ebba4c0e2aac", "title": "Transfer learning via attributes for improved on-the-fly classification", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6836097", "http://doi.ieeecomputersociety.org/10.1109/WACV.2014.6836097", "http://doi.org/10.1109/WACV.2014.6836097"]}, {"id": "ba156b81fe8fca1fd1bfb1c822e39205c4ff355b", "title": "Unsupervised Multi-class Joint Image Segmentation", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909798"]}, {"id": "72048081cfe678f700c52e1c7a56713a8e0865b6", "title": "Unsupervised Adversarial Visual Level Domain Adaptation for Learning Video Object Detectors from Images", "year": "2018", "pdf": ["https://arxiv.org/pdf/1810.02074.pdf"], "doi": []}, {"id": "9cd8a2d07f07d888fcf50aa0735d0831edcf5e46", "title": "Bag of contour fragments for robust shape classification", "year": "2014", "pdf": ["http://cis-linux1.temple.edu/~latecki/Papers/XinggangPR2014.pdf", "http://mc.eistar.net/~xwang/pubs/BagOfShape.pdf", "http://mclab.eic.hust.edu.cn/~xwang/pubs/BagOfShape.pdf", "https://cis.temple.edu/~latecki/Papers/XinggangPR2014.pdf"], "doi": ["http://doi.org/10.1016/j.patcog.2013.12.008"]}, {"id": "8c21cd8d5e98c77d727fc900450c6223f9e1fa24", "title": "DARE: Dynamic Adaptive Mobile Augmented Reality with Edge Computing", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8526799"]}, {"id": "7fe203374ba3ddc8462a7c775b276e53f09dd036", "title": "NavigationNet: A Large-scale Interactive Indoor Navigation Dataset", "year": "2018", "pdf": ["https://arxiv.org/pdf/1808.08374.pdf"], "doi": []}, {"id": "8f8599012002dd3bbb6526b3be92d7a7355ad22a", "title": "Construction et \u00e9valuation d'un corpus pour la recherche d'instances d'images mus\u00e9ales", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/8f85/99012002dd3bbb6526b3be92d7a7355ad22a.pdf"], "doi": []}, {"id": "ebf35073e122782f685a0d6c231622412f28a53b", "title": "A High-Quality Denoising Dataset for Smartphone Cameras", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578280"]}, {"id": "9463f71b2d8e291d5fc5a7db6b95b3d01e759b29", "title": "Describing Spatial Relationships between Objects in Images in English and French", "year": "2015", "pdf": ["http://www.emnlp2015.org/proceedings/VL/pdf/VL16.pdf"], "doi": ["https://doi.org/10.18653/v1%2FW15-2816", "http://aclweb.org/anthology/W15-2816", "https://doi.org/10.18653/v1/W15-2816"]}, {"id": "aaa6fe8045e1a071e1762cffe4f59e0bd508daf9", "title": "Single-Pedestrian Detection Aided by Two-Pedestrian Detection", "year": "2015", "pdf": ["http://www.ee.cuhk.edu.hk/~wlouyang/Papers/tpami15-ouyang_xgWang_xyZeng.pdf", "http://www.ee.cuhk.edu.hk/~xgwang/papers/ouyangZWtpami15.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6994306", "http://doi.ieeecomputersociety.org/10.1109/TPAMI.2014.2377734", "http://doi.org/10.1109/TPAMI.2014.2377734", "https://www.ncbi.nlm.nih.gov/pubmed/26353133"]}, {"id": "2a7007555f71e559c6aa33efbd3bd8b401638d82", "title": "Full interpretation of minimal images", "year": "2018", "pdf": ["https://perso.telecom-paristech.fr/bloch/AIC/articles/BenYosef2017.pdf"], "doi": ["https://www.sciencedirect.com/science/article/pii/S001002771730269X?dgcid=api_sd_search-api-endpoint", "http://doi.org/10.1016/j.cognition.2017.10.006", "https://www.ncbi.nlm.nih.gov/pubmed/29107889"]}, {"id": "08c71fe89af5f168b373e92b44a7cf9d1755fb8c", "title": "The Opportunity challenge: A benchmark database for on-body sensor-based activity recognition", "year": "2013", "pdf": ["http://infoscience.epfl.ch/record/182860/files/2013_ChavarriagaPRLETTERS_preprint.pdf?version=1", "https://www.researchgate.net/profile/Ricardo_Chavarriaga/publication/258031577_The_Opportunity_challenge_A_benchmark_database_for_on-body_sensor-based_activity_recognition/links/02e7e528146aa12213000000.pdf"], "doi": ["https://doi.org/10.1016/j.patrec.2012.12.014"]}, {"id": "8d73906f0a232e8b94200017e512446c1af4dd9d", "title": "Detection of U.S. Traffic Signs", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7116530"]}, {"id": "497857bce6ea1ed4889fb949a2f176072e2509c7", "title": "A Comparison of L_1 Norm and L_2 Norm Multiple Kernel SVMs in Image and Video Classification", "year": "2009", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=5137808"]}, {"id": "1d5f704a98d82c34de96ceb80fa06552082effd3", "title": "Dynamic Zoom-in Network for Fast Object Detection in Large Images", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578822"]}, {"id": "3de71ddc07619c0dd6bbaa3f7b412a9262a0e761", "title": "Discriminatively Trained And-Or Tree Models for Object Detection", "year": "2013", "pdf": ["http://vigir.missouri.edu/~gdesouza/Research/Conference_CDs/IEEE_CVPR2013/data/Papers/4989d278.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2013/papers/Song_Discriminatively_Trained_And-Or_2013_CVPR_paper.pdf", "http://www.stat.ucla.edu/~sczhu/papers/Conf_2013/DiscriminativeAOG_cvpr2013.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619265", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2013.421", "http://doi.org/10.1109/CVPR.2013.421"]}, {"id": "18b4a20ed465972d9d8f3f8d8982d321acf45907", "title": "Mod\u00e9lisation de contextes pour l'annotation s\u00e9mantique de vid\u00e9os. (Context based modeling for video semantic annotation)", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/18b4/a20ed465972d9d8f3f8d8982d321acf45907.pdf"], "doi": []}, {"id": "992a614aa601c52b20729538ea25b62471ffe8bc", "title": "Towards Automatic Construction of Diverse, High-quality Image Dataset", "year": "2017", "pdf": ["https://arxiv.org/pdf/1708.06495.pdf"], "doi": []}, {"id": "53822d61e829ef02a95a6c89fea082114fd3e16b", "title": "A General Framework for Tracking Multiple People from a Moving Camera", "year": "2013", "pdf": ["http://www.willowgarage.com/sites/default/files/pami_preprint.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6361406", "http://doi.org/10.1109/TPAMI.2012.248", "https://www.ncbi.nlm.nih.gov/pubmed/23681988", "https://www.wikidata.org/entity/Q48723090"]}, {"id": "323eb410e0d0978901a8baa670f905f280ab19ff", "title": "Inner-Scene Similarities as a Contextual Cue for Object Detection", "year": "2017", "pdf": ["https://arxiv.org/pdf/1707.04406.pdf"], "doi": []}, {"id": "7532996c27b199ed89b412a9f0df7483df83ea72", "title": "Committees of deep feedforward networks trained with few data", "year": "2014", "pdf": ["https://arxiv.org/pdf/1406.5947.pdf"], "doi": []}, {"id": "bf7238df8b3a7fc0ebf0e8028a417c7e99fca8d8", "title": "An ontology-based framework for the automated analysis and interpretation of comic books' images", "year": "2017", "pdf": [], "doi": ["https://doi.org/10.1016/j.ins.2016.10.032", "https://hal.archives-ouvertes.fr/hal-01387033/document"]}, {"id": "c6e042f9db094d3a01c13a9d3120fc6898f40cb8", "title": "Multi-label Classification for Image Annotation via Sparse Similarity Voting", "year": "2010", "pdf": ["http://naosite.lb.nagasaki-u.ac.jp/dspace/bitstream/10069/27087/1/LNCS6469_344.pdf", "https://page-one.springer.com/pdf/preview/10.1007/978-3-642-22819-3_35"], "doi": ["https://doi.org/10.1007/978-3-642-22819-3_35"]}, {"id": "2dd6749ddffa620d2ac40275a436ecd89aa51a45", "title": "Learning Dual Multi-Scale Manifold Ranking for Semantic Segmentation of High-Resolution Images", "year": "2017", "pdf": ["http://www.mdpi.com/2072-4292/9/5/500/pdf"], "doi": ["https://doi.org/10.3390/rs9050500", "https://www.preprints.org/manuscript/201704.0061/v1/download"]}, {"id": "478261574ddc6cf297611000735aa9808f8f0030", "title": "ScanNet: Richly-Annotated 3D Reconstructions of Indoor Scenes", "year": "2017", "pdf": ["https://arxiv.org/pdf/1702.04405.pdf"], "doi": []}, {"id": "c5fcc36768428185c0ec0f04c82c9204c9ba962c", "title": "Deep Material-Aware Cross-Spectral Stereo Matching", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578303"]}, {"id": "e4fc560a78e48bd927c2f6253f5fc489927bb15f", "title": "Detecting objects in internet videos AIMS Project Report", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/e4fc/560a78e48bd927c2f6253f5fc489927bb15f.pdf"], "doi": []}, {"id": "2049db406168f63c46e5efd2d5ceb5941e3fdc7c", "title": "Region detection and matching for object recognition", "year": "2013", "pdf": [], "doi": []}, {"id": "e42b89b6ed1c6d79286a62ded1e4c090f474eb40", "title": "Using image analytics to monitor retail store shelves", "year": "2015", "pdf": [], "doi": ["https://doi.org/10.1147/JRD.2015.2394513"]}, {"id": "64fb6a04a3ec96b2ad266c381c75f4dc16ce3460", "title": "Hole-based traffic sign detection method for traffic signs with red rim", "year": "2013", "pdf": [], "doi": ["https://doi.org/10.1007/s00371-013-0879-0"]}, {"id": "24c20c28871fa923c3f45b745b9b9f2d3d280e81", "title": "Harmony potentials for joint classification and segmentation", "year": "2010", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=5540048"]}, {"id": "06f1c079303937f6022e6157e6341c7921fe9428", "title": "Efficient Dense Rigid-Body Motion Segmentation and Estimation in RGB-D Video", "year": "2014", "pdf": ["http://ais.uni-bonn.de/papers/IJCV_2015_Stueckler_Motion_Segmentation.pdf", "http://www.ais.uni-bonn.de/papers/IJCV_2015_Stueckler_Motion_Segmentation.pdf"], "doi": ["https://doi.org/10.1007/s11263-014-0796-3"]}, {"id": "333b877ea761c5c1d4ffa39654fc19bd015e245d", "title": "Ontology-Based Semantic Image Segmentation Using Mixture Models and Multiple CRFs", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7450190"]}, {"id": "0ecaabbf846bbc78c91bf7ff71b998b61c0082d8", "title": "Automated Visual Fin Identification of Individual Great White Sharks", "year": "2016", "pdf": ["https://arxiv.org/pdf/1609.06323.pdf"], "doi": []}, {"id": "28863c0f3a1aa186bf1c281c73784cf36e2bf361", "title": "Efficient Non-iterative Domain Adaptation of Pedestrian Detectors to Video Scenes", "year": "2014", "pdf": ["http://eprints.whiterose.ac.uk/84865/1/ICPR14.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6976833", "http://doi.org/10.1109/ICPR.2014.123"]}, {"id": "054738ce39920975b8dcc97e01b3b6cc0d0bdf32", "title": "Towards the design of an end-to-end automated system for image and video-based recognition", "year": "2016", "pdf": ["https://arxiv.org/pdf/1601.07883.pdf"], "doi": []}, {"id": "4446924885545b255164b32e42b8375bac699f23", "title": "Object semantic categorization based on ensemble SVM classifiers", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7867229"]}, {"id": "fc2c39b6439623c00b10e8d9826b1c82e8487805", "title": "Generalized Semantic Preserving Hashing for N-Label Cross-Modal Retrieval", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2017/papers/Mandal_Generalized_Semantic_Preserving_CVPR_2017_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8099765", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2017.282", "http://doi.org/10.1109/CVPR.2017.282"]}, {"id": "92cd808bba43c3702d8cbddde65ee42bf01676d4", "title": "A MultiPath Network for Object Detection", "year": "2016", "pdf": ["https://arxiv.org/pdf/1604.02135.pdf"], "doi": []}, {"id": "3bccc5621b14f2e6b07a5936acecdf957724c6ff", "title": "Convolutional Fisher Kernels for RGB-D Object Recognition", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7335478", "http://doi.ieeecomputersociety.org/10.1109/3DV.2015.23", "http://doi.org/10.1109/3DV.2015.23"]}, {"id": "0b67879b1d5db9da12490b41b4f52d12626e87bc", "title": "The KIT object models database: An object model database for object recognition, localization and manipulation in service robotics", "year": "2012", "pdf": ["http://ijr.sagepub.com/content/31/8/927.full.pdf"], "doi": ["https://doi.org/10.1177/0278364912445831"]}, {"id": "98b4bf8cf8890f50b12e4fabe78bafd687a598c2", "title": "Semantic Labeling Based Vehicle Detection in Aerial Imagery", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8354178"]}, {"id": "e03a2299caf2febcc7b87ee4e61e78ad8cb24e45", "title": "Combined Holistic and Local Patches for Recovering 6D Object Pose", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8265469"]}, {"id": "26eadb307d62ab28713931beb8be9ff0f04c6ea0", "title": "Synthetic Viewpoint Prediction", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7801548", "http://doi.ieeecomputersociety.org/10.1109/CRV.2016.58", "http://doi.org/10.1109/CRV.2016.58"]}, {"id": "55d01b7314d78fe3bc5ae03b6e414ecba14188f8", "title": "Cognitive Inspired WOR Framework to Reveal Image Semantics, for Efficient Content Based Image Retrieval", "year": "2015", "pdf": [], "doi": ["http://dl.acm.org/citation.cfm?id=2709034"]}, {"id": "05e9e85b5137016c93d042170e82f77bb551a108", "title": "A Benchmark Dataset and Evaluation Methodology for Video Object Segmentation", "year": "2016", "pdf": ["http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Perazzi_A_Benchmark_Dataset_CVPR_2016_paper.pdf", "https://graphics.ethz.ch/~perazzif/davis/files/davis.pdf", "https://graphics.ethz.ch/~perazzif/davis/files/davis_poster_cvpr_2016.pdf", "https://graphics.ethz.ch/~perazzif/davis/files/davis_supplementary.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780454", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.85", "http://doi.org/10.1109/CVPR.2016.85"]}, {"id": "64bff565c83c6ce3fac783d8d67191af99803701", "title": "Learning to Co-Generate Object Proposals with a Deep Structured Network", "year": "2016", "pdf": ["http://infoscience.epfl.ch/record/217984/files/HayderHeSalzmannCVPR16.pdf", "http://openaccess.thecvf.com/content_cvpr_2016/papers/Hayder_Learning_to_Co-Generate_CVPR_2016_paper.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Hayder_Learning_to_Co-Generate_CVPR_2016_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780650", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.281", "http://doi.org/10.1109/CVPR.2016.281"]}, {"id": "66dcc6771e35068a1ea2f6e6f4cdb9a40a4df450", "title": "A Linear Approximation to the chi^2 Kernel with Geometric Convergence", "year": "2012", "pdf": ["https://arxiv.org/pdf/1206.4074.pdf"], "doi": []}, {"id": "dbf2d57def648d1dae7717c92a32ff02157e5cb5", "title": "RedNet: Residual Encoder-Decoder Network for indoor RGB-D Semantic Segmentation", "year": "2018", "pdf": ["https://arxiv.org/pdf/1806.01054.pdf"], "doi": []}, {"id": "2284ba28bd3b1afaf06afb8c2a94638e350b3ecb", "title": "Boosting Object Proposals: From Pascal to COCO", "year": "2015", "pdf": ["http://openaccess.thecvf.com/content_iccv_2015/papers/Pont-Tuset_Boosting_Object_Proposals_ICCV_2015_paper.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015/papers/Pont-Tuset_Boosting_Object_Proposals_ICCV_2015_paper.pdf", "http://www.vision.ee.ethz.ch/en/publications/papers/proceedings/eth_biwi_01226.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410538", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2015.181", "http://doi.org/10.1109/ICCV.2015.181"]}, {"id": "174b6d661b96840e27cd9435c2dbb8e538b2c8a6", "title": "Progressive Representation Adaptation for Weakly Supervised Object Localization", "year": "2017", "pdf": ["https://arxiv.org/pdf/1710.04647.pdf"], "doi": []}, {"id": "b95cdaaa0d6c191bcc8169ce555219ad545258fb", "title": "Online streaming feature selection: a minimum redundancy, maximum significance approach", "year": "2018", "pdf": [], "doi": ["https://doi.org/10.1007/s10044-018-0690-7"]}, {"id": "0f780a8cb09627bec41000345c2771df2853224a", "title": "Automatic inspection of aeronautic components", "year": "2017", "pdf": [], "doi": ["https://doi.org/10.1007/s00138-017-0839-1"]}, {"id": "c1206330ba57a27fd0acc29dd39825bbf2d91060", "title": "A Shape Reconstructability Measure of Object Part Importance with Applications to Object Detection and Localization", "year": "2014", "pdf": ["http://www.stat.ucla.edu/~yuille/Pubs10_12/PartImportance_IJCV2014_online.pdf"], "doi": ["https://doi.org/10.1007/s11263-014-0705-9"]}, {"id": "4c500c84e16e5ebb50b33f9bcff36854e5131c16", "title": "All-Transfer Learning for Deep Neural Networks and its Application to Sepsis Classification", "year": "2016", "pdf": ["https://arxiv.org/pdf/1711.04450.pdf"], "doi": []}, {"id": "02f86370fd467f0d03948a94a346034d8a111ffd", "title": "Semantic Video Retrieval Using High Level Context", "year": "2008", "pdf": ["https://pdfs.semanticscholar.org/02f8/6370fd467f0d03948a94a346034d8a111ffd.pdf"], "doi": []}, {"id": "d111faa1990f80e3351ea1eef0e5fc177d4e44b4", "title": "Iteratively Training Look-Up Tables for Network Quantization", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.05355.pdf"], "doi": []}, {"id": "165c27a4bfb56562c807279bef9d15f1bced5ca0", "title": "Scene parsing using inference Embedded Deep Networks", "year": "2016", "pdf": ["http://www.adv-ci.com/publications/2016_PR_Bu.pdf"], "doi": ["http://doi.org/10.1016/j.patcog.2016.01.027"]}, {"id": "f348d23a88fd81e05585897629f2f230fcfe77c7", "title": "Transfer Learning of Deep Neural Networks for Visual Collaborative Maritime Asset Identification", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8537839"]}, {"id": "87fe38a79ee12531bb618d4006a476b3a5256f3e", "title": "Relative Saliency and Ranking: Models, Metrics, Data, and Benchmarks", "year": "2018", "pdf": ["https://arxiv.org/pdf/1810.02426.pdf"], "doi": []}, {"id": "d8b8e165279ca2091d5af1440ed974db4792250f", "title": "Mean Response-Time Minimization of a Soft-Cascade Detector", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/ad73/ff39869e223dba6e0ee94481b6c32766df86.pdf"], "doi": []}, {"id": "0f6a2ea69c325bcbfca85fb05cb5f542873b1bf8", "title": "Food Recognition and Detection with Minimum Supervision", "year": "2016", "pdf": [], "doi": []}, {"id": "df8aee8aef6f0c71f968979318dafcd53da04bdc", "title": "Bending the Curve: Improving the ROC Curve Through Error Redistribution", "year": "2016", "pdf": ["https://arxiv.org/pdf/1605.06652.pdf"], "doi": []}, {"id": "70918453e9f147747b7a37d9159c8c1515a55ae4", "title": "Visual object tracking via the local soft cosine similarity", "year": "2018", "pdf": [], "doi": ["https://doi.org/10.1016/j.patrec.2018.03.026"]}, {"id": "1876095a9387a84e594d81675c9c2c17cb10f7cf", "title": "Accurate segmentation of complex document image using digital shearlet transform with neutrosophic set as uncertainty handling tool", "year": "2017", "pdf": ["http://fs.gallup.unm.edu/neut/AccurateSegmentationOfComplex.pdf"], "doi": ["http://doi.org/10.1016/j.asoc.2017.08.005"]}, {"id": "ad52d047a44f20416f9dd6655cef54169d481454", "title": "Perceptual modeling in the problem of active object recognition in visual scenes", "year": "2016", "pdf": [], "doi": ["http://doi.org/10.1016/j.patcog.2016.03.007"]}, {"id": "e096b11b3988441c0995c13742ad188a80f2b461", "title": "DeepProposals: Hunting Objects and Actions by Cascading Deep Convolutional Layers", "year": "2017", "pdf": ["https://arxiv.org/pdf/1606.04702.pdf"], "doi": []}, {"id": "56e95fa26fb417776824e5adf6d6d511e5b30110", "title": "Object and Action Classification with Latent Window Parameters", "year": "2013", "pdf": ["http://homepages.inf.ed.ac.uk/hbilen/assets/pdf/Bilen14.pdf", "http://www.cse.iitk.ac.in/users/cs365/2014/_papers/bilen-namboodri-vanGool-13_object-action-classify-latent-windows.pdf", "http://www.cse.iitk.ac.in/users/vinaypn/papers/bilen2013ijcv.pdf"], "doi": ["http://doi.org/10.1007/s11263-013-0646-8"]}, {"id": "e7df750805d6c025d0a1a74a05a83bcf8cc63dd7", "title": "Assessment of crowdsourcing and gamification loss in user-assisted object segmentation", "year": "2015", "pdf": ["http://upcommons.upc.edu/bitstream/handle/2117/81293/asknseek.pdf;jsessionid=469B72384B7C56D4A331D68A53942294?sequence=1"], "doi": ["https://doi.org/10.1007/s11042-015-2897-6"]}, {"id": "85eedee59aca5f2a591265a2173cf3a2799cdc94", "title": "Action and Event Recognition with Fisher Vectors on a Compact Feature Set", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751336"]}, {"id": "3463aeda3a8d33bc88d8383cc4ad451a6775c75a", "title": "Understanding Indoor Scenes Using 3D Geometric Phrases", "year": "2013", "pdf": ["http://courses.cs.washington.edu/courses/cse590v/13au/choi_cvpr13.pdf", "http://vigir.missouri.edu/~gdesouza/Research/Conference_CDs/IEEE_CVPR2013/data/Papers/4989a033.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2013/papers/Choi_Understanding_Indoor_Scenes_2013_CVPR_paper.pdf", "https://static.googleusercontent.com/media/research.google.com/en//pubs/archive/41340.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6618856", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2013.12", "http://doi.org/10.1109/CVPR.2013.12"]}, {"id": "70b420850e16ec2afe42d5c0006742d9045b3e7f", "title": "If You Can't Beat Them, Join Them: Learning with Noisy Data", "year": "2015", "pdf": [], "doi": ["http://dl.acm.org/citation.cfm?id=2806231"]}, {"id": "985b6a10c1bb9c8908d6d299c7ab0bba76df2259", "title": "Dense Decoder Shortcut Connections for Single-Pass Semantic Segmentation", "year": "2018", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2018/papers/Bilinski_Dense_Decoder_Shortcut_CVPR_2018_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578788", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2018.00690", "http://doi.org/10.1109/CVPR.2018.00690"]}, {"id": "82451d0ae2e0154b5f9cd096af199c35319e911a", "title": "Image spam filtering using convolutional neural networks", "year": "2018", "pdf": [], "doi": ["http://doi.org/10.1007/s00779-018-1168-8"]}, {"id": "8ff6294535acf46abf523b879f20685de0692a8c", "title": "Bayes Risk for Large Scale Hierarchical Top-K Image Classification", "year": "2013", "pdf": ["https://www.research-collection.ethz.ch/bitstream/handle/20.500.11850/153936/eth-6877-01.pdf?isAllowed=y&sequence=1"], "doi": ["https://doi.org/10.3929/ethz-a-009767867"]}, {"id": "d97224063697392f073e467005e89973d2be7d65", "title": "Recherche de motifs fr\u00e9quents dans une base de cartes combinatoires. (Frequent pattern discovery in combinatorial maps databases)", "year": "2011", "pdf": ["https://pdfs.semanticscholar.org/02d1/8e600804a1a6ff354856d8dcb80ceb4c8a43.pdf"], "doi": []}, {"id": "74a1336f1fbc8b7bb3b6e159711af1a91336ce22", "title": "An overview of traffic sign detection methods", "year": "2010", "pdf": ["https://pdfs.semanticscholar.org/74a1/336f1fbc8b7bb3b6e159711af1a91336ce22.pdf"], "doi": []}, {"id": "e33bc0cd79d92d6868989a29c3ab06b75f808590", "title": "Deep Nets: What have they ever done for Vision?", "year": "2018", "pdf": ["https://arxiv.org/pdf/1805.04025.pdf"], "doi": []}, {"id": "0b4d3e59a0107f0dad22e74054bab1cf1ad9c32e", "title": "Visual Genome: Connecting Language and Vision Using Crowdsourced Dense Image Annotations", "year": "2016", "pdf": ["https://arxiv.org/pdf/1602.07332.pdf"], "doi": []}, {"id": "14d1a458f49e251cbbab34349e379469300a2bae", "title": "Scene Parsing with Object Instances and Occlusion Ordering", "year": "2014", "pdf": ["http://slazebni.cs.illinois.edu/publications/jtighe-cvpr14.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2014/papers/Tighe_Scene_Parsing_with_2014_CVPR_paper.pdf", "http://wwwx.cs.unc.edu/~mn/sites/default/files/jtighe-cvpr14.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909874", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2014.479", "http://doi.org/10.1109/CVPR.2014.479"]}, {"id": "a6cd743c29667ab5baef9d66d6558247b1cd00b0", "title": "New in-situ training image and one-shot detection model without adaptation GENETIM detection model for synset bottle", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/a6cd/743c29667ab5baef9d66d6558247b1cd00b0.pdf"], "doi": []}, {"id": "9b8746e9480c3bdcaa6efca33096369422c624aa", "title": "Algae Detection Using Computer Vision and Deep Learning", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.10847.pdf"], "doi": []}, {"id": "3325860c0c82a93b2eac654f5324dd6a776f609e", "title": "2D Human Pose Estimation: New Benchmark and State of the Art Analysis", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909866"]}, {"id": "896e2776174dcb86d311789ab83a266151d0595b", "title": "A Novel Performance Evaluation Methodology for Single-Target Trackers", "year": "2016", "pdf": ["https://arxiv.org/pdf/1503.01313.pdf"], "doi": []}, {"id": "bf26ccc92bca086195c5f250aef2e409a1c7cd85", "title": "Local Bayes Risk Minimization Based Stopping Strategy for Hierarchical Classification", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8215524", "http://doi.ieeecomputersociety.org/10.1109/ICDM.2017.61", "http://doi.org/10.1109/ICDM.2017.61"]}, {"id": "ff3a9545e73adea5275a1c7c71c5e3fe2e35a9a1", "title": "An Enhanced Feature Extraction Technique for Diagnosis of Pathological Problems in Mango Crop", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/ff3a/9545e73adea5275a1c7c71c5e3fe2e35a9a1.pdf"], "doi": []}, {"id": "21d1225296aad388406824eb113715c4b90ed3da", "title": "Dirichlet-Based Concentric Circle Feature Transform for Breast Mass Classification", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7372146", "http://doi.ieeecomputersociety.org/10.1109/ICTAI.2015.50", "http://doi.org/10.1109/ICTAI.2015.50"]}, {"id": "3f0b0ffe315ee111fc028561ec4ecf2c93f94a05", "title": "Pose Normalization Network for Object Classification", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/3f0b/0ffe315ee111fc028561ec4ecf2c93f94a05.pdf"], "doi": []}, {"id": "75b987f86af2bc7f68edc45be240dd30e1ef2699", "title": "Sampling Algorithms to Handle Nuisances in Large-Scale Recognition", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/75b9/87f86af2bc7f68edc45be240dd30e1ef2699.pdf"], "doi": []}, {"id": "6a405e7284ff7e2127a241d60646b4abd3da92f2", "title": "Generate To Adapt : Unsupervised Domain Adaptation using Generative Adversarial Networks", "year": "2017", "pdf": [], "doi": []}, {"id": "c0e551acb063c9cd73dea28ab8963f850b6f1148", "title": "A Comparison of Techniques based on Image Classification and Object Detection to Count Cars and Non-empty Stalls in Parking Spaces", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/c0e5/51acb063c9cd73dea28ab8963f850b6f1148.pdf"], "doi": []}, {"id": "8b45a87f3dfc8eccd745161effbf2457a9097e6a", "title": "WEAKLY SUPERVISED SEMANTIC SEGMENTATION 3 priors can give good pixel labelling results", "year": "2017", "pdf": [], "doi": []}, {"id": "25d75339720787e7003f2f103cf38cee8175972a", "title": "Optimistic and Pessimistic Neural Networks for Scene and Object Recognition", "year": "2016", "pdf": ["https://arxiv.org/pdf/1609.07982.pdf"], "doi": []}, {"id": "12d9a4233a16ea08fbb1de853b6a97b4f4952c23", "title": "Tractable Structured Prediction using the Permutohedral Lattice", "year": "2017", "pdf": ["https://www.research-collection.ethz.ch/bitstream/handle/20.500.11850/130429/eth-50807-01.pdf?isAllowed=y&sequence=1", "https://www.research-collection.ethz.ch/bitstream/handle/20.500.11850/130429/eth-50807-02.pdf?isAllowed=y&sequence=2"], "doi": ["https://doi.org/10.3929/ethz-a-010882665"]}, {"id": "33d101fe276fd5e6220c9b40c33e1a1d1389e5bb", "title": "DOC: DEEP OCCLUSION ESTIMATION FROM A SIN-", "year": "2016", "pdf": [], "doi": []}, {"id": "c6c691b772822881c5c52b779100928f0d54fdd7", "title": "Using Visual Saliency to Improve Human Detection with Convolutional Networks", "year": "2018", "pdf": [], "doi": []}, {"id": "11a3084768f035c824662a85a348f02466693d2a", "title": "Lifting Object Detection Datasets into 3D", "year": "2016", "pdf": ["https://arxiv.org/pdf/1503.06465.pdf"], "doi": []}, {"id": "4be10db13a9210e078d78a4a072c569d9bbd9939", "title": "Seed, Expand and Constrain: Three Principles for Weakly-Supervised Image Segmentation", "year": "2016", "pdf": ["https://arxiv.org/pdf/1603.06098.pdf"], "doi": []}, {"id": "18a849b1f336e3c3b7c0ee311c9ccde582d7214f", "title": "Efficiently Scaling Up Crowdsourced Video Annotation A Set of Best Practices for High Quality , Economical Video Labeling", "year": "2012", "pdf": ["https://pdfs.semanticscholar.org/18a8/49b1f336e3c3b7c0ee311c9ccde582d7214f.pdf"], "doi": []}, {"id": "13e424d502bf539108ad6f5cc877cfb1255dbee0", "title": "Improving Vision-Based Self-Positioning in Intelligent Transportation Systems via Integrated Lane and Vehicle Detection", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7045914"]}, {"id": "1dbd7653ede6af15d539f64cb2128752ca029e44", "title": "Hollywood 3D: Recognizing Actions in 3D Natural Scenes", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619280"]}, {"id": "f4c45108cb41051010d8a5175b8da23eb246c967", "title": "Improving Image Captioning by Leveraging Knowledge Graphs", "year": "2019", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8658870"]}, {"id": "1b3ee5455956a40c6e9e09ccda0f4fb162838629", "title": "The Recognition of License Plate Restrictions Based on Faster R-CNN", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/1b3e/e5455956a40c6e9e09ccda0f4fb162838629.pdf"], "doi": []}, {"id": "5c45a1abc51fe059987bcfba19b1d5076a8d9afb", "title": "Autonomous Object Category Learning for Service Robots Using Internet Resources", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/5c45/a1abc51fe059987bcfba19b1d5076a8d9afb.pdf"], "doi": []}, {"id": "4a31b3fcc346bf3235efe1c0fb310833570cef27", "title": "Learning Intelligent Dialogs for Bounding Box Annotation", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8579054"]}, {"id": "ed62a56b81511d7fcf6d247014987163d9668982", "title": "\"What happens if...\" Learning to Predict the Effect of Forces in Images", "year": "2016", "pdf": ["https://arxiv.org/pdf/1603.05600.pdf"], "doi": []}, {"id": "29aa3dc15450e6eb46c34f30f0e224e5ea16615e", "title": "Sketch Me That Shoe", "year": "2016", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2016/papers/Yu_Sketch_Me_That_CVPR_2016_paper.pdf", "http://vision.cs.utexas.edu/381V-fall2016/slides/hsiao_paper.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Yu_Sketch_Me_That_CVPR_2016_paper.pdf", "https://www.eecs.qmul.ac.uk/~qian/SketchMeThatShoe.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780462", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.93", "http://doi.org/10.1109/CVPR.2016.93"]}, {"id": "1999d5e0700bf8fa50bb1bab5b981bda1d111a4f", "title": "Monocular Road Terrain Detection by Combining Visual and Spatial Information", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/73b1/10df4809d0a015f90fa6e7a7dce351bcc52e.pdf", "https://www.researchgate.net/profile/Jannik_Fritsch/publication/261073577_Monocular_Road_Terrain_Detection_by_Combining_Visual_and_Spatial_Information/links/5475ef240cf29afed612e5a8.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6766705", "http://doi.org/10.1109/TITS.2014.2303899"]}, {"id": "34072c31c2c778df471c9f0c43ba6198dfd0db32", "title": "Arbitrary Category Classification of Websites Based on Image Content", "year": "2015", "pdf": ["http://users.ics.aalto.fi/juha/papers/ELM2014.pdf", "http://www.engineering.uiowa.edu/sites/default/files/files/newpaper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7083681", "http://doi.org/10.1109/MCI.2015.2405317"]}, {"id": "d23ac99cdab20a9a3eca2784a5b262649c717988", "title": "Rotation Invariant Angular Descriptor Via A Bandlimited Gaussian-like Kernel", "year": "2016", "pdf": ["https://arxiv.org/pdf/1606.02753.pdf"], "doi": []}, {"id": "22cf367d14e646914cc959bbcd402df0c20cd0dc", "title": "Towards Automated Melanoma Screening: Proper Computer Vision & Reliable Results", "year": "2016", "pdf": ["https://arxiv.org/pdf/1604.04024.pdf"], "doi": []}, {"id": "c9d73438bf5e66bd0c4f512c5a4e53c3e33e721e", "title": "Adding spatial distribution clue to aggregated vector in image retrieval", "year": "2018", "pdf": ["https://jivp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13640-018-0247-0?site=jivp-eurasipjournals.springeropen.com"], "doi": ["http://doi.org/10.1186/s13640-018-0247-0"]}, {"id": "a74b045f28670e8f85173e0e483581520d667f02", "title": "Object tracking using Langevin Monte Carlo particle filter and locality sensitive histogram based likelihood model", "year": "2018", "pdf": [], "doi": ["http://doi.org/10.1016/j.cag.2017.07.023"]}, {"id": "c56da136b8d62125009a131f6dc21fcd0dd6a559", "title": "ICDAR2017 Robust Reading Challenge on Text Extraction from Biomedical Literature Figures (DeTEXT)", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8270166", "http://doi.ieeecomputersociety.org/10.1109/ICDAR.2017.235", "http://doi.org/10.1109/ICDAR.2017.235"]}, {"id": "02e5372e439c09f8a8ce8c4784b044ce116ca11c", "title": "DeepCorrect: Correcting DNN models against Image Distortions", "year": "2017", "pdf": ["https://arxiv.org/pdf/1705.02406.pdf"], "doi": []}, {"id": "e8b2a98f87b7b2593b4a046464c1ec63bfd13b51", "title": "CMS-RCNN: Contextual Multi-Scale Region-based CNN for Unconstrained Face Detection", "year": "2016", "pdf": ["https://arxiv.org/pdf/1606.05413.pdf"], "doi": []}, {"id": "5fdbebf417da2427744d2c60f413b5375e68993e", "title": "Discriminative Sub-categorization", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619062"]}, {"id": "32bebe84ffbd4fd81f0e5bb30dbc90774aa3b14b", "title": "Segmentation Results Stimuli Final Saliency Map Ground Truth Constructed Graph CCA", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/32be/be84ffbd4fd81f0e5bb30dbc90774aa3b14b.pdf"], "doi": []}, {"id": "a02e5d8e2a10176dc5e2566e1b492823a0cb6ee2", "title": "A learning framework for higher-order consistency models in multi-class pixel labeling problems", "year": "2014", "pdf": [], "doi": []}, {"id": "383d64b27fb3cdf2beff43f3beb8caac8c21a886", "title": "Detecting activities of daily living in first-person camera views", "year": "2012", "pdf": ["http://people.csail.mit.edu/hpirsiav/papers/adl_cvpr12.pdf", "http://people.csail.mit.edu/hpirsiav/papers/adl_cvpr12_poster.pdf", "http://people.csail.mit.edu/hpirsiav/papers/adl_cvpr12_slides.pdf", "http://vision.ics.uci.edu/papers/PirsiavashR_CVPR_2012_1/PirsiavashR_CVPR_2012_1.pdf", "http://web.cs.hacettepe.edu.tr/~erkut/bil722.f12/w06-cagdas.pdf", "http://www.cs.utexas.edu/~cv-fall2012/slides/dinesh-expt.pdf", "http://www.ics.uci.edu/~dramanan/papers/ADL_2012.pdf", "https://www.cs.cmu.edu/~deva/papers/ADL_2012.pdf", "https://www.csee.umbc.edu/~hpirsiav/papers/adl_cvpr12.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6248010", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2012.6248010", "http://doi.org/10.1109/CVPR.2012.6248010"]}, {"id": "5e0f8c355a37a5a89351c02f174e7a5ddcb98683", "title": "Microsoft COCO: Common Objects in Context", "year": "2014", "pdf": ["https://arxiv.org/pdf/1405.0312.pdf"], "doi": []}, {"id": "64c1158a4061882d610f1cffd5ddb1e8fc9a74b4", "title": "Gated Feedback Refinement Network for Dense Image Labeling", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2017/papers/Islam_Gated_Feedback_Refinement_CVPR_2017_paper.pdf", "http://www.cs.umanitoba.ca/~ywang/papers/cvpr17.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8100001", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2017.518", "http://doi.org/10.1109/CVPR.2017.518"]}, {"id": "284be8be0c6bedc36dfe43229bc84345ab0aedc2", "title": "Faster Training of Mask R-CNN by Focusing on Instance Boundaries", "year": "2018", "pdf": ["https://arxiv.org/pdf/1809.07069.pdf"], "doi": []}, {"id": "be2d326fa588b4ffd1d8d3d4408ae680e1a26277", "title": "JOURNA A Survey on Modern Era \u2019 s Online Object Tracking Algorithms", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/be2d/326fa588b4ffd1d8d3d4408ae680e1a26277.pdf"], "doi": []}, {"id": "2a2232f2972191a0606d588aa4f13c9f27d1972d", "title": "InstanceCut: From Edges to Instances with MultiCut", "year": "2017", "pdf": ["https://arxiv.org/pdf/1611.08272.pdf"], "doi": []}, {"id": "029cabb6f3f6a824590e735feb1d8557646db8a6", "title": "One-Bit Object Detection: On learning to localize objects with minimal supervision", "year": "2014", "pdf": ["https://arxiv.org/pdf/1403.1024.pdf"], "doi": []}, {"id": "fd23dda0abe2d6a3ae0c8253c89110364cdecbc9", "title": "Deep Learning for People Detection on Beach Images", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8575616", "http://doi.ieeecomputersociety.org/10.1109/BRACIS.2018.00045", "http://doi.org/10.1109/BRACIS.2018.00045"]}, {"id": "c3c4f0caf1b42b6466306360c4ebe16f66489df0", "title": "Gated Feedback Refinement Network for Coarse-to-Fine Dense Semantic Image Labeling", "year": "2018", "pdf": ["https://arxiv.org/pdf/1806.11266.pdf"], "doi": []}, {"id": "03fd6774f57aaed9320060e4527121c59e9eca2b", "title": "Intrinsic spatial pyramid matching for deformable 3D shape retrieval", "year": "2013", "pdf": [], "doi": ["https://doi.org/10.1007/s13735-013-0041-9"]}, {"id": "304aa9bfd6bc32d3d87abce6a229d973270bbd73", "title": "Fast Neural Cell Detection Using Light-Weight SSD Neural Network", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2017_workshops/w8/papers/Yi_Fast_Neural_Cell_CVPR_2017_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8014853", "http://doi.ieeecomputersociety.org/10.1109/CVPRW.2017.119", "http://doi.org/10.1109/CVPRW.2017.119"]}, {"id": "c8ba499e8d8daa32637885f03137f41d61023bf9", "title": "Weak supervision for detecting object classes from activities", "year": "2017", "pdf": ["https://ps.is.tue.mpg.de/uploads_file/attachment/attachment/296/weak_supervision_object_detection.pdf"], "doi": ["http://doi.org/10.1016/j.cviu.2016.09.006"]}, {"id": "cd1a636c1261208084cb8395c877c7ca22c76df1", "title": "Fast Deep Vehicle Detection in Aerial Images", "year": "2017", "pdf": ["https://www.computer.org/csdl/proceedings/wacv/2017/4822/00/07926624.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7926624", "http://doi.org/10.1109/WACV.2017.41"]}, {"id": "101c7305f141145c4d168dfa40284e0ad86a0d9b", "title": "Active Object Localization with Deep Reinforcement Learning", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410643"]}, {"id": "48922520e6de0954a83f26977b2b50b7fbfdcf61", "title": "A survey of sketch-based image retrieval", "year": "2018", "pdf": [], "doi": ["https://doi.org/10.1007/s00138-018-0953-8"]}, {"id": "c37fe13f94dfc2f3494a35a63336689ce4392135", "title": "MPNET: An End-to-End Deep Neural Network for Object Detection in Surveillance Video", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8365094", "http://doi.org/10.1109/ACCESS.2018.2836921"]}, {"id": "0f8f9253c81fd90fe44d474cc185d4ae2487e5b4", "title": "NYC3DCars: A Dataset of 3D Vehicles in Geographic Context", "year": "2013", "pdf": ["http://nyc3d.cs.cornell.edu/static/paper.pdf", "http://www.cs.cornell.edu/~snavely/publications/papers/nyc3dcars_iccv13.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2013/papers/Matzen_NYC3DCars_A_Dataset_2013_ICCV_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751204", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2013.99", "http://doi.org/10.1109/ICCV.2013.99"]}, {"id": "e8ffef3d4d74720e766e506e175e533bdc8ee705", "title": "Object Detection Networks on Convolutional Feature Maps", "year": "2017", "pdf": ["https://arxiv.org/pdf/1504.06066.pdf"], "doi": []}, {"id": "1daf971c087f5e21dbae831231377cbe9bb2f188", "title": "Incorporating Structural Alternatives and Sharing into Hierarchy for Multiclass Object Recognition and Detection", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619272"]}, {"id": "8d74fbd46f9d5d615e350c4593cbc5b5ca63fa8b", "title": "Data driven visual tracking via representation learning and online multi-class LPBoost learning", "year": "2016", "pdf": [], "doi": ["http://doi.org/10.1049/iet-cvi.2014.0388"]}, {"id": "7af667b6c1b4b32f513dd70fe3ef36fcf344a741", "title": "A transfer learning based approach for automated grading of Gliomas using deep Residual Networks", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/7af6/67b6c1b4b32f513dd70fe3ef36fcf344a741.pdf"], "doi": []}, {"id": "d9dafc343727db2b6060c868d748f97eff6bac7d", "title": "Improved pedestrian detection using motion segmentation and silhouette orientation", "year": "2017", "pdf": [], "doi": ["http://doi.org/10.1007/s11042-017-4933-1"]}, {"id": "3b304585d5af0afe98a85d6e0559315fbf3a7807", "title": "An Improved Labelling for the INRIA Person Data Set for Pedestrian Detection", "year": "2013", "pdf": ["http://welcome.isr.ist.utl.pt/img/pdfs/2999_2013_IbPRIA_Taiana_Nascimento_Bernardino.pdf", "http://welcome.isr.tecnico.ulisboa.pt/wp-content/uploads/2015/05/2999_2013_IbPRIA_Taiana_Nascimento_Bernardino.pdf"], "doi": ["http://doi.org/10.1007/978-3-642-38628-2_34"]}, {"id": "99df9e95b3f3d187636918a65277baf7c98cbfc5", "title": "An efficient subsequence search for video anomaly detection and localization", "year": "2015", "pdf": [], "doi": ["https://doi.org/10.1007/s11042-015-2453-4", "https://www.wikidata.org/entity/Q56907428"]}, {"id": "832246357de85108cb910e773c203997448c570a", "title": "Recurrently Target-Attending Tracking", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780530"]}, {"id": "74031f12dde0be772a742b96bf5f4c8d9fa41ec7", "title": "Joint Object-Material Category Segmentation from Audio-Visual Cues", "year": "2015", "pdf": ["https://arxiv.org/pdf/1601.02220.pdf"], "doi": []}, {"id": "9452d029f5d140aece06619b6fd8e47b070cacd1", "title": "Urban classification by pixel and object-based approaches for very high resolution imagery", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/9452/d029f5d140aece06619b6fd8e47b070cacd1.pdf"], "doi": []}, {"id": "7268747251a61d1ce3285baade15c372d4c566d6", "title": "Person Attribute Recognition with a Jointly-Trained Holistic CNN Model", "year": "2015", "pdf": ["http://web-info8.informatik.rwth-aachen.de/media/papers/sudowe_spitzer_leibe_ICCV_LaP_2015.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015_workshops/w11/papers/Sudowe_Person_Attribute_Recognition_ICCV_2015_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7406400", "http://doi.ieeecomputersociety.org/10.1109/ICCVW.2015.51", "http://doi.org/10.1109/ICCVW.2015.51"]}, {"id": "81763bb718dc6630be210c056a250b1c2ed57fd7", "title": "3D Semantic Parsing of Large-Scale Indoor Spaces", "year": "2016", "pdf": ["http://buildingparser.stanford.edu/images/CVPR_2016_poster.pdf", "http://buildingparser.stanford.edu/images/supp_mat.pdf", "http://openaccess.thecvf.com/content_cvpr_2016/papers/Armeni_3D_Semantic_Parsing_CVPR_2016_paper.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Armeni_3D_Semantic_Parsing_CVPR_2016_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780539", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.170", "http://doi.org/10.1109/CVPR.2016.170"]}, {"id": "9d5db7427b44d83bf036ff4cff382c23c6c7b6d8", "title": "Video redaction: a survey and comparison of enabling technologies", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/f78d/6d092deaafee550fb58d6ea6e8b559325876.pdf"], "doi": []}, {"id": "a228ba020bd321d29ab24485cb2988a62707fd64", "title": "Using objective ground-truth labels created by multiple annotators for improved video classification: A comparative study", "year": "2013", "pdf": ["https://engineering.purdue.edu/RVL/Publications/Srivastava2013.pdf"], "doi": ["http://doi.org/10.1016/j.cviu.2013.06.009"]}, {"id": "037f2e9d2d2aa15c3d476f4aa358da96707b4b44", "title": "Square Localization for Efficient and Accurate Object Detection", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410651"]}, {"id": "bf3aae7293f664d512c0904916d804327af22f52", "title": "STDnet: A ConvNet for Small Target Detection", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/bf3a/ae7293f664d512c0904916d804327af22f52.pdf"], "doi": []}, {"id": "d6b514a68abff3ab14af9fc0152cd5b28bd0192c", "title": "Instance Segmentation by Deep Coloring", "year": "2018", "pdf": ["https://arxiv.org/pdf/1807.10007.pdf"], "doi": []}, {"id": "0de46e6768acaa71745406d646573644b975dc62", "title": "Scene-Domain Active Part Models for Object Representation", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410644"]}, {"id": "e24792ec2a6cb8971b2f6befb4b97b9fe2d79952", "title": "Bottom-up Object Detection by Grouping Extreme and Center Points", "year": "2019", "pdf": ["https://arxiv.org/pdf/1901.08043.pdf"], "doi": []}, {"id": "1d7029a974f950de61f3980704956b43f1a06e7b", "title": "Efficient Optimization for Rank-Based Loss Functions", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578487"]}, {"id": "22a8b7ca2e6449cad31ae4f71bb3587751087e77", "title": "DeepBox: Learning Objectness with Convolutional Networks", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410642"]}, {"id": "9c4365a56fb3cf41b15712657b15f7422ca0dab2", "title": "A Hybrid Supervised-Unsupervised Vocabulary Generation Algorithm for Visual Concept Recognition", "year": "2010", "pdf": ["https://pdfs.semanticscholar.org/9c43/65a56fb3cf41b15712657b15f7422ca0dab2.pdf"], "doi": []}, {"id": "37b9ea1bf5b6ce8ecb656628af3933c64c632c2b", "title": "Transfer Learning for 3 D LiDAR-based Human Classification with a Mobile Robot", "year": "2018", "pdf": [], "doi": []}, {"id": "f79c4bf83371627ba139b61eb427463b93cd687b", "title": "Learning from Few Examples for Visual Recognition Problems", "year": "2011", "pdf": ["https://pdfs.semanticscholar.org/f79c/4bf83371627ba139b61eb427463b93cd687b.pdf"], "doi": []}, {"id": "084bd219dd239dc4c9a02621a5333d3bc1446566", "title": "DeepTrack: Learning Discriminative Feature Representations Online for Robust Visual Tracking", "year": "2015", "pdf": ["https://arxiv.org/pdf/1503.00072.pdf"], "doi": []}, {"id": "1c9da6cef6b1be9c116b26dd52c341c0adcf7db2", "title": "Interactive Perception: Leveraging Action in Perception and Perception in Action", "year": "2017", "pdf": ["https://arxiv.org/pdf/1604.03670.pdf"], "doi": []}, {"id": "549c719c4429812dff4d02753d2db11dd490b2ae", "title": "YouTube-BoundingBoxes: A Large High-Precision Human-Annotated Data Set for Object Detection in Video", "year": "2017", "pdf": ["https://arxiv.org/pdf/1702.00824.pdf"], "doi": []}, {"id": "e430d1ae3a28ec342f767cdfb19aeb76c20a3f21", "title": "Fast and Accurate, Convolutional Neural Network Based Approach for Object Detection from UAV", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8592805"]}, {"id": "3b4ad6b789837a6a878f33c0b7ddb1b1fc7daaf8", "title": "Fine-grained recognition of plants from images", "year": "2017", "pdf": ["https://plantmethods.biomedcentral.com/track/pdf/10.1186/s13007-017-0265-4?site=plantmethods.biomedcentral.com"], "doi": ["https://doi.org/10.1186/s13007-017-0265-4", "https://www.ncbi.nlm.nih.gov/pubmed/29299049"]}, {"id": "f92ceb6875f614bbccb25e4b11ca55353773890f", "title": "Saliency Detection via Boundary Prior and Center Prior", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/f92c/eb6875f614bbccb25e4b11ca55353773890f.pdf"], "doi": []}, {"id": "828b73e8a4d539eeae82601b5f5a4392818c6430", "title": "Long-Term Tracking by Decision Making", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/828b/73e8a4d539eeae82601b5f5a4392818c6430.pdf"], "doi": []}, {"id": "2114b25727a21275e88e30dad0423752f6047dae", "title": "Generic Visual Recognition on Non-Uniform Distributions Based on AdaBoost Codebooks", "year": "2011", "pdf": ["https://pdfs.semanticscholar.org/cac0/c534e02784a3a873690d213dd8c92b81992f.pdf"], "doi": []}, {"id": "7cb4d30b3bfb0d4b02499c15c7c7a9dfddda8049", "title": "Object Tracking using L 1 / L 2 Sparse Coding and Multi Scale Max Pooling", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/7cb4/d30b3bfb0d4b02499c15c7c7a9dfddda8049.pdf"], "doi": []}, {"id": "b7efecec654acd8831d045e728b54356c697c9c8", "title": "Learning Semantic Segmentation with Diverse Supervision", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8354268"]}, {"id": "eacb95e81156c48f4ff7470567ba205225170fa7", "title": "Learning Aerial Image Segmentation From Online Maps", "year": "2017", "pdf": ["https://arxiv.org/pdf/1707.06879.pdf"], "doi": []}, {"id": "14b311b848b51b7b5345573a289b1cedcbb4d581", "title": "Instance Similarity Deep Hashing for Multi-Label Image Retrieval", "year": "2018", "pdf": ["https://arxiv.org/pdf/1803.02987.pdf"], "doi": []}, {"id": "24ff832171cb774087a614152c21f54589bf7523", "title": "Beat-Event Detection in Action Movie Franchises", "year": "2015", "pdf": ["https://arxiv.org/pdf/1508.03755.pdf"], "doi": []}, {"id": "ffd73d1956163a4160ec2c96b3ab256f79fc92e8", "title": "Attributes as Semantic Units between Natural Language and Visual Recognition", "year": "2016", "pdf": ["https://arxiv.org/pdf/1604.03249.pdf"], "doi": []}, {"id": "99c37dba394b100ba8f3d895c0ee0e57d5852347", "title": "Are Cars Just 3D Boxes? Jointly Estimating the 3D Shape of Multiple Objects", "year": "2014", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2014/papers/Zia_Are_Cars_Just_2014_CVPR_paper.pdf", "http://resources.mpi-inf.mpg.de/publications/D2/2014/zia14cvpr.pdf", "http://www.igp.ethz.ch/photogrammetry/publications/pdf_folder/cvpr2014zz.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909865", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2014.470", "http://doi.org/10.1109/CVPR.2014.470"]}, {"id": "f6b649023e49a341f042f9a17b2f923db58ccf35", "title": "Feature representation of RGB-D images using joint spatial-depth feature pooling", "year": "2016", "pdf": [], "doi": ["https://doi.org/10.1016/j.patrec.2016.04.001"]}, {"id": "f9f86d087e84eaf0e6a09575982aa7b41fa62451", "title": "Image Synthesis for Self-Supervised Visual Representation Learning", "year": "2018", "pdf": [], "doi": ["https://www.base-search.net/Record/6ecfef13a126fd20b941bbb80477b94bd643db70d224a43b1d0b0cb61aa181b1"]}, {"id": "b85c198ce09ffc4037582a544c7ffb6ebaeff198", "title": "Efficient Multiple Instance Metric Learning Using Weakly Supervised Data", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2017/papers/Law_Efficient_Multiple_Instance_CVPR_2017_paper.pdf", "http://www.cs.toronto.edu/~law/publications/CVPR/2017/mimlca_cvpr_2017.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8100113", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2017.630", "http://doi.org/10.1109/CVPR.2017.630"]}, {"id": "c77c094faf7b1a4e293609a0909c7c50b468675a", "title": "Satyam: Democratizing Groundtruth for Machine Vision", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.03621.pdf"], "doi": []}, {"id": "2a5667702b0f1ff77dde8fb3e2e10d4e05e8de9d", "title": "Scene Parsing through ADE20K Dataset", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2017/papers/Zhou_Scene_Parsing_Through_CVPR_2017_paper.pdf", "http://people.csail.mit.edu/bzhou/publication/scene-parse-camera-ready.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8100027", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2017.544", "http://doi.org/10.1109/CVPR.2017.544"]}, {"id": "a422c2bd9030c8a2c89b6db79be2743c4a4609fb", "title": "Auto Deep Compression by Reinforcement Learning Based Actor-Critic Structure", "year": "2018", "pdf": ["https://arxiv.org/pdf/1807.02886.pdf"], "doi": []}, {"id": "46a1172c784c3741e79781ef2353209b08dbea67", "title": "YouTube2Text: Recognizing and Describing Arbitrary Activities Using Semantic Hierarchies and Zero-Shot Recognition", "year": "2013", "pdf": ["http://www.cs.utexas.edu/users/ml/papers/guadarrama.iccv13.pdf", "http://www.cs.utexas.edu/users/ml/posters/guadarrama.iccv13.pdf", "http://www.eecs.berkeley.edu/~sguada/pdfs/2013-ICCV-YouTube2Text-final.pdf", "https://www.cs.utexas.edu/~vsub/pdf/YouTube2Text_Recognizing_and_2013_ICCV_paper.pdf", "https://www.icsi.berkeley.edu/pubs/vision/youtube2text13.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751448", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2013.337", "http://doi.org/10.1109/ICCV.2013.337"]}, {"id": "670b10569c5f978ee70d99cf8c14ad9cabb9d454", "title": "Masked face detection via a modified LeNet", "year": "2016", "pdf": [], "doi": ["http://doi.org/10.1016/j.neucom.2016.08.056"]}, {"id": "4acf31294e940d85a4eea56c244205e3a66d8b8e", "title": "Improving Product Classification Using Images", "year": "2011", "pdf": ["http://talukdar.net/papers/ImageText-ICDM2011.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6137235", "http://doi.ieeecomputersociety.org/10.1109/ICDM.2011.79", "http://doi.org/10.1109/ICDM.2011.79"]}, {"id": "057f5ffda59a3412f1e62159e96f84faa352628e", "title": "Tracking with scattering descriptor", "year": "2014", "pdf": [], "doi": ["http://doi.org/10.1049/iet-cvi.2013.0124"]}, {"id": "4404a99e2f6db3e703609168a3595e0fbdeabc38", "title": "Online Video SEEDS for Temporal Window Objectness", "year": "2013", "pdf": ["http://www.cv-foundation.org/openaccess/content_iccv_2013/papers/Van_Den_Bergh_Online_Video_SEEDS_2013_ICCV_paper.pdf", "http://www.mvdblive.org/research/videoseeds.pdf", "http://www.vision.ee.ethz.ch/en/publications/papers/proceedings/eth_biwi_01056.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751156", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2013.54", "http://doi.org/10.1109/ICCV.2013.54"]}, {"id": "59ee0f67bcf2d8ea0bbbfcbc71159725fc3a7059", "title": "Object Detection with Appearance-based Mixture Models Anonymous CVPR submission", "year": "2010", "pdf": ["https://pdfs.semanticscholar.org/59ee/0f67bcf2d8ea0bbbfcbc71159725fc3a7059.pdf"], "doi": []}, {"id": "e478c322de923337627487d8a688f5922b45b2ff", "title": "Automatic Garage Door Opening Using License Plate Recognition and Fingerprint Verification", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/e478/c322de923337627487d8a688f5922b45b2ff.pdf"], "doi": []}, {"id": "8a3b481d8e06b4acf6e95d8bc2484016f5862668", "title": "Text Detection in Traffic Informatory Signs Using Synthetic Data", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8270075", "http://doi.ieeecomputersociety.org/10.1109/ICDAR.2017.144", "http://doi.org/10.1109/ICDAR.2017.144"]}, {"id": "7c594c0b9482624745dd95767f3eebde1ee7f043", "title": "Representing Visual Scenes for Robot Control", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/7c59/4c0b9482624745dd95767f3eebde1ee7f043.pdf"], "doi": []}, {"id": "0ceda9dae8b9f322df65ca2ef02caca9758aec6f", "title": "Context-Aware CNNs for Person Head Detection", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410688"]}, {"id": "5f0e9cc18374a670dfea4698424c9d48494f3093", "title": "Online Domain Adaptation for Multi-Object Tracking", "year": "2015", "pdf": ["https://arxiv.org/pdf/1508.00776.pdf"], "doi": []}, {"id": "d47d72afc590f5b96117a5227d45157135da21ad", "title": "Attribute-based knowledge transfer learning for human pose estimation", "year": "2013", "pdf": [], "doi": ["http://doi.org/10.1016/j.neucom.2012.05.032"]}, {"id": "05db46c7745c360fa5938ee204c81efdcc84c1da", "title": "An Empirical Evaluation of Current Convolutional Architectures\u2019 Ability to Manage Nuisance Location and Scale Variability", "year": "2016", "pdf": ["https://arxiv.org/pdf/1505.06795.pdf"], "doi": []}, {"id": "0d4cdadd765c3003b0bd5f762b84bef93408f548", "title": "Learning and Transferring Mid-level Image Representations Using Convolutional Neural Networks", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909618"]}, {"id": "5d16ce0c66cd87dd48cb8c53f5b6a7ee73d33abb", "title": "Robust and Real-Time Object Tracking Using Scale-Adaptive Correlation Filters", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7797075", "http://doi.org/10.1109/DICTA.2016.7797075"]}, {"id": "050e5b4043009e54dff9319877fe947885db2d6e", "title": "Saliency Guided Dictionary Learning for Weakly-Supervised Image Parsing", "year": "2016", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2016/papers/Lai_Saliency_Guided_Dictionary_CVPR_2016_paper.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Lai_Saliency_Guided_Dictionary_CVPR_2016_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780764", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2016.395", "http://doi.org/10.1109/CVPR.2016.395"]}, {"id": "926dd1c4db38356ac5bf87c1a4c6b93625f9a850", "title": "Pulling Actions out of Context: Explicit Separation for Effective Combination", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578834"]}, {"id": "b705ca751a947e3b761e2305b41891051525d9df", "title": "Exploring Context with Deep Structured Models for Semantic Segmentation", "year": "2018", "pdf": ["https://arxiv.org/pdf/1603.03183.pdf"], "doi": []}, {"id": "be48b5dcd10ab834cd68d5b2a24187180e2b408f", "title": "Constrained Low-Rank Learning Using Least Squares-Based Regularization", "year": "2017", "pdf": ["https://arxiv.org/pdf/1611.04870.pdf"], "doi": []}, {"id": "b2f63863e73a8565895ca3d9d7d6a1e10a7695b1", "title": "Efficient Neural Network Compression via Transfer Learning for Industrial Optical Inspection", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/b2f6/3863e73a8565895ca3d9d7d6a1e10a7695b1.pdf"], "doi": []}, {"id": "044ae9738c2445d4fda30fcd6c289eddf8b3add9", "title": "Multiple Instance Learning: A Survey of Problem Characteristics and Applications", "year": "2018", "pdf": ["https://arxiv.org/pdf/1612.03365.pdf"], "doi": []}, {"id": "2ba540ca70c7dee81e13768792aa7571952987f6", "title": "Drivable Road Detection Based on Dilated FPN with Feature Aggregation", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8372075", "http://doi.ieeecomputersociety.org/10.1109/ICTAI.2017.00172", "http://doi.org/10.1109/ICTAI.2017.00172"]}, {"id": "6c9f45c76b4f96fe66d8e1d7b31f89b7cc6caa44", "title": "DeNet: Scalable Real-Time Object Detection with Directed Sparse Sampling", "year": "2017", "pdf": ["https://arxiv.org/pdf/1703.10295.pdf"], "doi": []}, {"id": "a0ae4ffe252f32514240cf6d82d52538de5fb78c", "title": "AN ALGORITHM FOR PEDESTRIAN DETECTION IN MULTISPECTRAL IMAGE SEQUENCES", "year": "", "pdf": ["https://pdfs.semanticscholar.org/a0ae/4ffe252f32514240cf6d82d52538de5fb78c.pdf"], "doi": []}, {"id": "115e8a4f76a57b893c985ea4f7530b90d071679c", "title": "FSSD: Feature Fusion Single Shot Multibox Detector", "year": "2017", "pdf": ["https://arxiv.org/pdf/1712.00960.pdf"], "doi": []}, {"id": "c2be82ed0db509087b08423c8cf39ab3c36549c3", "title": "Pixel-level guided face editing with fully convolution networks", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8019363", "http://doi.ieeecomputersociety.org/10.1109/ICME.2017.8019363", "http://doi.org/10.1109/ICME.2017.8019363"]}, {"id": "92f2639dbd9f7c4284b7012809e4d2c407834774", "title": "Point-based Medialness 2 D Shape Description and Identification", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/92f2/639dbd9f7c4284b7012809e4d2c407834774.pdf"], "doi": []}, {"id": "4ace7c8edd9467c7d5bfa00e942531e7b889e650", "title": "Depth-Based Hand Pose Estimation: Data, Methods, and Challenges", "year": "2015", "pdf": ["http://vision.ics.uci.edu/papers/SupancicRYSR_ICCV_2015/SupancicRYSR_ICCV_2015.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015/papers/Supancic_Depth-Based_Hand_Pose_ICCV_2015_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410574", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2015.217", "http://doi.org/10.1109/ICCV.2015.217"]}, {"id": "4c454fda214e00c9cba4bb759da78949a4130873", "title": "Specialization of a Generic Pedestrian Detector to a Specific Traffic Scene by the Sequential Monte-Carlo Filter and the Faster R-CNN", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/4c45/4fda214e00c9cba4bb759da78949a4130873.pdf"], "doi": []}, {"id": "f541dac9d0d49cadb3cfd018e87b26e03e3f13aa", "title": "Trio Constrained Adaptive Noise Removal ( TCANR ) Mechanism for Salt and Pepper Noise in Image Classification", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/f541/dac9d0d49cadb3cfd018e87b26e03e3f13aa.pdf"], "doi": []}, {"id": "aa2ad3df24d8d8c4a4d2fe85f0d4e635d595f0a2", "title": "PedCut: an iterative framework for pedestrian segmentation combining shape models and multiple data cues", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/c029/edca476ddda4050c3c67748056c6189cd1e3.pdf"], "doi": []}, {"id": "d250e57f6b7e06bb1dac41c8b89700086a85999e", "title": "Self-Supervised Generalisation with Meta Auxiliary Learning", "year": "2019", "pdf": ["https://arxiv.org/pdf/1901.08933.pdf"], "doi": []}, {"id": "de35ea60396629b2d1ceb73df56a97ed21012680", "title": "Robust object tracking via multi-scale patch based sparse coding histogram", "year": "2016", "pdf": [], "doi": ["https://doi.org/10.1007/s11042-016-3289-2"]}, {"id": "a0e286f3c6a72c857ffd03bd8ab9a9f9b98c4432", "title": "AI Learns to Recognize Bengali Handwritten Digits: Bengali.AI Computer Vision Challenge 2018", "year": "2018", "pdf": ["https://arxiv.org/pdf/1810.04452.pdf"], "doi": []}, {"id": "19339e816d8006ad462868b01812b03eb463ead1", "title": "Collective activity localization by spatiality preservation search", "year": "2016", "pdf": [], "doi": ["https://doi.org/10.1080/01691864.2016.1172506", "https://www.wikidata.org/entity/Q58025855"]}, {"id": "899e7ff67aa2630edc8776758cc5d65823f099c1", "title": "G-CNN: Object Detection via Grid Convolutional Neural Network", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8097417", "http://doi.org/10.1109/ACCESS.2017.2770178"]}, {"id": "139ab79a0aae5d4346f907b7b29288d09ef373fa", "title": "A Baseline for Multi-Label Image Classification Using Ensemble Deep CNN", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.08412.pdf"], "doi": []}, {"id": "94780b00dc2807ec507ae91500b622ec7a8ddb12", "title": "Selective Feature Connection Mechanism: Concatenating Multi-layer CNN Features with a Feature Selector", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.06295.pdf"], "doi": []}, {"id": "fa496716a5b8520e94a0126b5baa4f636623c997", "title": "Revisiting Knowledge Transfer for Training Object Class Detectors", "year": "2018", "pdf": ["https://arxiv.org/pdf/1708.06128.pdf"], "doi": []}, {"id": "c2cb4da617168c76c4560a01de8b5e68b5250749", "title": "FineTag: Multi-attribute Classification at Fine-grained Level in Images", "year": "2018", "pdf": ["https://arxiv.org/pdf/1806.07124.pdf"], "doi": []}, {"id": "87d5b53580ca5f77ccc3ff157337ef3456308943", "title": "Augmented Autoencoders for object orientation estimation trained on synthetic RGB images", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/87d5/b53580ca5f77ccc3ff157337ef3456308943.pdf"], "doi": []}, {"id": "eb2333a759788903848c49111a03c4c00d188e70", "title": "Color-based and Rotation Invariant Self-similarities", "year": "2017", "pdf": ["http://www.scitepress.org/Papers/2017/61075/61075.pdf"], "doi": ["https://doi.org/10.5220/0006107503440351"]}, {"id": "af9cc1767f50f63291d7ca9ab709f6849cd1e46c", "title": "Graph-Driven Diffusion and Random Walk Schemes for Image Segmentation.", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/af9c/c1767f50f63291d7ca9ab709f6849cd1e46c.pdf"], "doi": []}, {"id": "4fe91feab83d947a0d3bd85adcf18ab1b3d9e05f", "title": "Transductive People Tracking in Unconstrained Surveillance", "year": "2016", "pdf": ["http://imagelab.ing.unimore.it/Pubblicazioni/pubblicazioni/2015TCSVT.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7067436", "http://doi.org/10.1109/TCSVT.2015.2416555"]}, {"id": "8eaade06b75dac977574d05ce1058b86df059d47", "title": "Indoor Scene Understanding with RGB-D Images: Bottom-up Segmentation, Object Detection and Semantic Segmentation", "year": "2014", "pdf": ["http://people.eecs.berkeley.edu/~sgupta/pdf/ijcv14a.pdf"], "doi": ["https://doi.org/10.1007/s11263-014-0777-6"]}, {"id": "b9b21cfa7de32677151571ab44d27d2d246b7a03", "title": "Towards Explanation of DNN-based Prediction with Guided Feature Inversion", "year": "2018", "pdf": ["https://arxiv.org/pdf/1804.00506.pdf"], "doi": []}, {"id": "4152d2c8585f7e3f85d3b3d84036171de104cbd7", "title": "Rethinking ImageNet Pre-training", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.08883.pdf"], "doi": []}, {"id": "b31f37fd71b7b45e6fd8978960e271a7db1ee212", "title": "DICTING IMAGE ROTATIONS", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/b31f/37fd71b7b45e6fd8978960e271a7db1ee212.pdf"], "doi": []}, {"id": "149f3cc167b046dc790b1f4f1c48eeb31e898403", "title": "A study of vehicle detector generalization on U.S. highway", "year": "2016", "pdf": ["http://cvrr.ucsd.edu/publications/2016/0669.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7795567", "http://doi.org/10.1109/ITSC.2016.7795567"]}, {"id": "1a1654456decd116f4ca84c98006dfda0a8a3134", "title": "INTEGRATED VISUAL INFORMATION FOR MARITIME SURVEILLANCE", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/1a16/54456decd116f4ca84c98006dfda0a8a3134.pdf"], "doi": []}, {"id": "3e00dd86c084d8680409c65c1a48f1b3aa864eb7", "title": "Deep Crisp Boundaries: From Boundaries to Higher-Level Tasks", "year": "2019", "pdf": ["https://arxiv.org/pdf/1801.02439.pdf"], "doi": []}, {"id": "1e5edbd39b4c61f785515e117a74e2d280aefbe7", "title": "The urrent tate and TRL ssessment of eople racking echnology for ideo urveillance pplications", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/1e5e/dbd39b4c61f785515e117a74e2d280aefbe7.pdf"], "doi": []}, {"id": "2e1f0b522014c942197e51b556eeb48b6ad66cda", "title": "Automatic object classification using motion blob based local feature fusion for traffic scene surveillance", "year": "2012", "pdf": [], "doi": ["http://doi.org/10.1007/s11704-012-1296-7"]}, {"id": "25858dc59faf2630bf0eefe23297ce262370cff0", "title": "Monitoring Giraffe Behavior in Thermal Video", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7046812"]}, {"id": "e545f1c06799bfd2bd5f7eaed085fd60a388202f", "title": "A top-down manner-based DCNN architecture for semantic image segmentation", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/e545/f1c06799bfd2bd5f7eaed085fd60a388202f.pdf"], "doi": []}, {"id": "7b3a63d030d03e536ddcbc217bc8d6fd630e3b53", "title": "xView: Objects in Context in Overhead Imagery", "year": "2018", "pdf": ["https://arxiv.org/pdf/1802.07856.pdf"], "doi": []}, {"id": "4a6049e1926cc8e574301cfb229599cdc0a64e62", "title": "Characterizing the performance of an image-based recognizer for planar mechanical linkages in textbook graphics and hand-drawn sketches", "year": "2015", "pdf": ["http://vdel.me.cmu.edu/publications/2015cag/paper.pdf"], "doi": ["http://doi.org/10.1016/j.cag.2015.06.002"]}, {"id": "ec6f1a4b9367675833f0111c44a22ba217fcbd23", "title": "Visual Tracking via Constrained Incremental Non-negative Matrix Factorization", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7045563", "http://doi.org/10.1109/LSP.2015.2404856"]}, {"id": "5950512e21114236208b9eaeebc9a09735e367a6", "title": "Master research Internship Internship report Segmentation and recognition of symbols for printed and handwritten music scores", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/5950/512e21114236208b9eaeebc9a09735e367a6.pdf"], "doi": []}, {"id": "c7780cff11068fecb322a43e459c56267a88aee7", "title": "DeepVoting: An Explainable Framework for Semantic Part Detection under Partial Occlusion", "year": "2017", "pdf": [], "doi": []}, {"id": "98bf42055160845e6f8f3c022298e3b8e4e55f80", "title": "Vision Meets Drones: A Challenge", "year": "2018", "pdf": ["https://arxiv.org/pdf/1804.07437.pdf"], "doi": []}, {"id": "19b6b0649cc669791c799c52fc56bdc556f06916", "title": "Efficient Model Evaluation with Bilinear Separation Model", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7045964"]}, {"id": "cf58f90e14b49ce35548d89c7339b7fc4db9ba4f", "title": "Generating Diverse Image Datasets with Limited Labeling", "year": "2016", "pdf": [], "doi": ["http://dl.acm.org/citation.cfm?id=2967285"]}, {"id": "4ff486644be5e451784d6ae83f8073c8320fa974", "title": "Visual Tracking with Convolutional Neural Network", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7379494", "http://doi.org/10.1109/SMC.2015.362"]}, {"id": "a43f460f6c1abbe8eb0097594df6eafc0f651d49", "title": "Saliency-based object recognition in video", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/a43f/460f6c1abbe8eb0097594df6eafc0f651d49.pdf"], "doi": []}, {"id": "b4df58f1fd8a3bd0815e7fb957f7f07fddd77338", "title": "Rethinking the sGLOH Descriptor", "year": "2018", "pdf": ["http://cvg.dsi.unifi.it/colombo_now/CC/Public/sGLOH2_TPAMI_2017.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7911291", "http://doi.org/10.1109/TPAMI.2017.2697849", "https://www.ncbi.nlm.nih.gov/pubmed/28459683", "https://www.wikidata.org/entity/Q38811217"]}, {"id": "ceee9ba72a021ae5604db04a93fdcff421d60216", "title": "Encoder Based Lifelong Learning", "year": "2017", "pdf": ["https://arxiv.org/pdf/1704.01920.pdf"], "doi": []}, {"id": "c4a0e89793961dc486964802df55ae73fbba60ee", "title": "Soccer: Who Has the Ball? Generating Visual Analytics and Player Statistics", "year": "2018", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2018_workshops/papers/w34/Theagarajan_Soccer_Who_Has_CVPR_2018_paper.pdf", "http://vislab.ucr.edu/PUBLICATIONS/pubs/Journal%20and%20Conference%20Papers/after10-1-1997/Conference/2018/FINAL-published-soccer-ball-generating.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8575390", "http://doi.ieeecomputersociety.org/10.1109/CVPRW.2018.00227", "http://doi.org/10.1109/CVPRW.2018.00227"]}, {"id": "2622d2467f19bc60427f8ea495515e7da82316c9", "title": "Tell Me Where to Look: Guided Attention Inference Network", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8579058"]}, {"id": "ccee8af5667d1d3bccf30baf2c6f049f031bb5ad", "title": "Mixing Hierarchical Contexts for Object Recognition", "year": "2011", "pdf": ["http://web.ing.puc.cl/~asoto/papers/Peralta-2011.pdf"], "doi": ["https://doi.org/10.1007/978-3-642-25085-9_27"]}, {"id": "c96f012f4915398259e7e223810c57898b5e1a76", "title": "Fast LIDAR-based Road Detection Using Convolutional Neural Networks", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/c96f/012f4915398259e7e223810c57898b5e1a76.pdf"], "doi": []}, {"id": "7142e659d6466717cdb8a242d8e34fce176b3f4a", "title": "Improved scene identification and object detection on egocentric vision of daily activities", "year": "2017", "pdf": ["http://crcv.ucf.edu/news&info/DefenseBooklet_FA17.pdf", "http://crcv.ucf.edu/papers/cviu2016-gonzalo.pdf", "http://vision.eecs.ucf.edu/papers/cviu2016-gonzalo.pdf"], "doi": ["http://doi.org/10.1016/j.cviu.2016.10.016"]}, {"id": "3b483c986b973856e016f761ec312c1a339766a5", "title": "DOTA: A Large-Scale Dataset for Object Detection in Aerial Images", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578516"]}, {"id": "1281e443d2cf1c1dd71ed3b7b0376d408d0958af", "title": "SALICON: Reducing the Semantic Gap in Saliency Prediction by Adapting Deep Neural Networks", "year": "2015", "pdf": ["http://www.cs.cornell.edu/~xhuang/publications/salicon_poster.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015/papers/Huang_SALICON_Reducing_the_ICCV_2015_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410395", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2015.38", "http://doi.org/10.1109/ICCV.2015.38"]}, {"id": "71f7be73a575f3689b0137446289d02462e1c5b0", "title": "Adaptive Multi-Scale Information Flow for Object Detection.", "year": "2018", "pdf": ["http://bmvc2018.org/contents/papers/0266.pdf"], "doi": []}, {"id": "581fb0f0405c7f0e60610d88ceaceb9af44d8569", "title": "Final Report : Smart Trash Net : Waste Localization and Classification", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/581f/b0f0405c7f0e60610d88ceaceb9af44d8569.pdf"], "doi": []}, {"id": "eaa7c6293c9d858bd4c9897a5dfc7c670f2a8671", "title": "Distant Vehicle Detection Using Radar and Vision", "year": "2019", "pdf": ["https://arxiv.org/pdf/1901.10951.pdf"], "doi": []}, {"id": "2cea306754ed83eaf1d0433abbfb05b5a4c4cf48", "title": "BIG-OH: BInarization of gradient orientation histograms", "year": "2014", "pdf": ["http://vgl-ait.org/mdailey/uploads/publication_file/filename/110/Baber-BIG-OH.pdf"], "doi": ["http://doi.org/10.1016/j.imavis.2014.08.006"]}, {"id": "eb2ab9caa61b021c1cd7aff6d08163768faba99e", "title": "Cleaning Up Multiple Detections Caused by Sliding Window Based Object Detectors", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/eb2a/b9caa61b021c1cd7aff6d08163768faba99e.pdf"], "doi": []}, {"id": "5a364ecb2d10b637c63b885d27eb372390232277", "title": "Unsupervised Robust Feature-Based Partition Ensembling to Discover Categories", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7789641"]}, {"id": "1114c2aba97a5782a48341817811df2438d0fdbf", "title": "Robust Visual Tracking using Multi-Frame Multi-Feature Joint Modeling", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.07498.pdf"], "doi": []}, {"id": "367008b91eb57c5ea64ef7520dfcabc0c5c85532", "title": "Person Re-identification: Past, Present and Future", "year": "2016", "pdf": ["https://arxiv.org/pdf/1610.02984.pdf"], "doi": []}, {"id": "8211c974ec152e79235cb57a03ba2971e913508f", "title": "Multimodal Image Retrieval", "year": "2012", "pdf": [], "doi": ["https://doi.org/10.1007/s13735-012-0006-4"]}, {"id": "eb69f89588e9538194750f12bf8c8df6d5301f3b", "title": "Object Tracking by a Combination of Discriminative Global and Generative Multi-Scale Local Models", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/eb69/f89588e9538194750f12bf8c8df6d5301f3b.pdf"], "doi": []}, {"id": "d6bdc70d259b38bbeb3a78db064232b4b4acc88f", "title": "Video-Based Face Association and Identification", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7961735", "http://doi.ieeecomputersociety.org/10.1109/FG.2017.27", "http://doi.org/10.1109/FG.2017.27"]}, {"id": "d2e8efaa0d095c22455fe4eab260f94994bfb116", "title": "Stand-alone quality estimation of background subtraction algorithms", "year": "2017", "pdf": [], "doi": ["http://doi.org/10.1016/j.cviu.2017.08.005"]}, {"id": "abe9f3b91fd26fa1b50cd685c0d20debfb372f73", "title": "The Pascal Visual Object Classes Challenge: A Retrospective", "year": "2014", "pdf": ["http://homepages.inf.ed.ac.uk/ckiw/postscript/ijcv_voc14.pdf", "http://www.robots.ox.ac.uk/~vgg/publications/2015/Everingham15/everingham15.pdf", "https://www.research.ed.ac.uk/portal/files/20017166/ijcv_voc14.pdf"], "doi": ["http://doi.org/10.1007/s11263-014-0733-5"]}, {"id": "10d3f77225eca1d576268ba84ed83f230a5e47c4", "title": "Crafting a multi-task CNN for viewpoint estimation", "year": "2016", "pdf": ["https://arxiv.org/pdf/1609.03894.pdf"], "doi": []}, {"id": "a01c7eec51fa901b2526325f563480c152c58ee5", "title": "Contour Box: Rejecting Object Proposals without Explicit Closed Contours", "year": "2015", "pdf": ["http://openaccess.thecvf.com/content_iccv_2015/papers/Lu_Contour_Box_Rejecting_ICCV_2015_paper.pdf", "http://www.cse.cuhk.edu.hk/leojia/papers/contour_iccv15.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015/papers/Lu_Contour_Box_Rejecting_ICCV_2015_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410591", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2015.234", "http://doi.org/10.1109/ICCV.2015.234"]}, {"id": "3db4bdee7bc03239ef25d23cf8dc14ce5a5300e2", "title": "Sparse Coding for Object Recognition", "year": "2013", "pdf": [], "doi": []}, {"id": "32cde90437ab5a70cf003ea36f66f2de0e24b3ab", "title": "The Cityscapes Dataset for Semantic Urban Scene Understanding", "year": "2016", "pdf": ["https://arxiv.org/pdf/1604.01685.pdf"], "doi": []}, {"id": "39978ba7c83333475d6825d0ff897692933895fc", "title": "Conditional Random Fields as Recurrent Neural Networks", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410536"]}, {"id": "aa23d33983b1abd2d8a677040eb875e93c478a7f", "title": "Measuring the Objectness of Image Windows", "year": "2012", "pdf": ["http://groups.inf.ed.ac.uk/calvin/Publications/alexe11-techreport.pdf", "http://groups.inf.ed.ac.uk/calvin/Publications/alexe12pami.pdf", "http://www.vision.ee.ethz.ch/en/publications/papers/techreports/eth_biwi_00882.pdf", "https://www.research.ed.ac.uk/portal/files/17686204/Alexe_et_al_2010_Measuring_the_objectnessi.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6133291", "http://doi.org/10.1109/TPAMI.2012.28", "https://www.ncbi.nlm.nih.gov/pubmed/22248633", "https://www.wikidata.org/entity/Q50666022"]}, {"id": "cab372bc3824780cce20d9dd1c22d4df39ed081a", "title": "DeepLab: Semantic Image Segmentation with Deep Convolutional Nets, Atrous Convolution, and Fully Connected CRFs", "year": "2018", "pdf": ["https://arxiv.org/pdf/1606.00915.pdf"], "doi": []}, {"id": "04e1c7618e4ef3e16159b27c522ddf94068c4f99", "title": "Reconstructing PASCAL VOC", "year": "2014", "pdf": ["http://home.isr.uc.pt/~joaoluis/papers/cvpr14_reconstruct_pascal_slides.pdf", "http://home.isr.uc.pt/~joaoluis/papers/cvpr2014_1.pdf", "http://people.eecs.berkeley.edu/~carreira/papers/cvpr14_reconstruct_pascal_slides.pdf", "http://people.eecs.berkeley.edu/~carreira/papers/cvpr2014_1.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2014/papers/Vicente_Reconstructing_PASCAL_VOC_2014_CVPR_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909407", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2014.13", "http://doi.org/10.1109/CVPR.2014.13"]}, {"id": "b183947ee15718b45546eda6b01e179b9a95421f", "title": "Edge Boxes: Locating Object Proposals from Edges", "year": "2014", "pdf": ["http://vigir.missouri.edu/~gdesouza/Research/Conference_CDs/ECCV_2014/papers/8693/86930391.pdf", "http://vision.ucsd.edu/~pdollar/files/papers/ZitnickDollarECCV14edgeBoxes.pdf", "http://www.robots.ox.ac.uk/~vgg/rg/papers/ZitnickDollarECCV14edgeBoxes.pdf"], "doi": ["https://doi.org/10.1007/978-3-319-10602-1_26"]}, {"id": "127316fbe268c78c519ceb23d41100e86639418a", "title": "CNN Features Off-the-Shelf: An Astounding Baseline for Recognition", "year": "2014", "pdf": ["https://arxiv.org/pdf/1403.6382.pdf"], "doi": []}, {"id": "148686aebefff0a7fb3f80024f765ef4b06d2efc", "title": "Learning Rich Features from RGB-D Images for Object Detection and Segmentation", "year": "2014", "pdf": ["https://arxiv.org/pdf/1407.5736.pdf"], "doi": []}, {"id": "1fef45786e707e6b9b8517b0403e596ecbdea6a5", "title": "Sketch-based manga retrieval using manga109 dataset", "year": "2016", "pdf": ["https://arxiv.org/pdf/1510.04389.pdf"], "doi": []}, {"id": "4a19f6545473363b16d4a10ed13fef29b38856d3", "title": "What is a Salient Object? A Dataset and a Baseline Model for Salient Object Detection", "year": "2015", "pdf": ["https://arxiv.org/pdf/1412.5027.pdf"], "doi": []}, {"id": "7d39d69b23424446f0400ef603b2e3e22d0309d6", "title": "YOLO9000: Better, Faster, Stronger", "year": "2017", "pdf": ["https://arxiv.org/pdf/1612.08242.pdf"], "doi": []}, {"id": "9bde2137a6a374ff81820e55a75ae5b70bf7fd5e", "title": "PLS/OPLS models in metabolomics: the impact of permutation of dataset rows on the K-fold cross-validation quality parameters.", "year": "2015", "pdf": [], "doi": ["https://www.ncbi.nlm.nih.gov/pubmed/25382277", "https://doi.org/10.1039/C4MB00414K"]}, {"id": "00bc01bc02b4c602e28bbcc162fa33d449a1e0e6", "title": "Action from Still Image Dataset and Inverse Optimal Control to Learn Task Specific Visual Scanpaths", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/00bc/01bc02b4c602e28bbcc162fa33d449a1e0e6.pdf"], "doi": []}, {"id": "bfa6ad4d71008505729274d008a9b4a7d92b2985", "title": "Semantic Understanding of Scenes Through the ADE20K Dataset", "year": "2018", "pdf": ["https://arxiv.org/pdf/1608.05442.pdf"], "doi": []}, {"id": "21a1654b856cf0c64e60e58258669b374cb05539", "title": "You Only Look Once: Unified, Real-Time Object Detection", "year": "2016", "pdf": ["https://arxiv.org/pdf/1506.02640.pdf"], "doi": []}, {"id": "12660f0defc6580e566c0fa2ac909971d6c6883b", "title": "The SYNTHIA Dataset: A Large Collection of Synthetic Images for Semantic Segmentation of Urban Scenes", "year": "2016", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2016/papers/Ros_The_SYNTHIA_Dataset_CVPR_2016_paper.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2016/papers/Ros_The_SYNTHIA_Dataset_CVPR_2016_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780721", "http://doi.org/10.1109/CVPR.2016.352", "https://www.wikidata.org/entity/Q57840870"]}, {"id": "ec187cedb69b389d06da26b17d889020e36ba6f6", "title": "ModaNet: A Large-scale Street Fashion Dataset with Polygon Annotations", "year": "2018", "pdf": [], "doi": ["http://dl.acm.org/citation.cfm?id=3240652"]}, {"id": "dcb6f06631021811091ce691592b12a237c12907", "title": "SeaShips: A Large-Scale Precisely Annotated Dataset for Ship Detection", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8438999", "http://doi.org/10.1109/TMM.2018.2865686"]}, {"id": "562463fafacca4bbe5256e318eb628bf915f4114", "title": "SLNSW-UTS: A Historical Image Dataset for Image Multi-Labeling and Retrieval", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7797084"]}, {"id": "8bc80a5d721757868d85d9e40c56c15d9b5c0df0", "title": "Total-Text: A Comprehensive Dataset for Scene Text Detection and Recognition", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8270088"]}, {"id": "a8f24fcc1eb0354ffd91f0e3031f5c4dc3e02dd6", "title": "R-FCN: Object Detection via Region-based Fully Convolutional Networks", "year": "2016", "pdf": ["https://arxiv.org/pdf/1605.06409.pdf"], "doi": []}, {"id": "51a4d658c93c5169eef7568d3d1cf53e8e495087", "title": "Unsupervised Visual Domain Adaptation Using Subspace Alignment", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751479"]}, {"id": "20a78d3145279dcd799cd7a856ae2714f4863a16", "title": "SSD: Single Shot MultiBox Detector", "year": "2016", "pdf": ["https://arxiv.org/pdf/1512.02325.pdf"], "doi": []}, {"id": "165ef2b5f86b9b2c68b652391db5ece8c5a0bc7e", "title": "Efficient Piecewise Training of Deep Structured Models for Semantic Segmentation", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780717"]}, {"id": "061356704ec86334dbbc073985375fe13cd39088", "title": "Very Deep Convolutional Networks for Large-Scale Image Recognition", "year": "2015", "pdf": ["https://arxiv.org/pdf/1409.1556.pdf"], "doi": []}, {"id": "bf5f67ebbe41f2fb1726a7c3c0be707366d5a4fb", "title": "Indoor Segmentation and Support Inference from RGBD Images", "year": "2012", "pdf": ["http://cs.nyu.edu/~silberman/papers/indoor_seg_support.pdf", "http://cs.nyu.edu/~silberman/papers/indoor_seg_support_supplementary.pdf", "http://videolectures.net/site/normal_dl/tag=725527/eccv2012_silberman_images_01.pdf", "http://web.engr.illinois.edu/~dhoiem/publications/eccv2012_indoorkinect_nathan.pdf"], "doi": ["https://doi.org/10.1007/978-3-642-33715-4_54"]}, {"id": "2dc9b005e936c9c303386caacc8d41cabdb1a0a1", "title": "Return of the Devil in the Details: Delving Deep into Convolutional Nets", "year": "2014", "pdf": ["https://arxiv.org/pdf/1405.3531.pdf"], "doi": []}, {"id": "2f56b1ac5b9faac9527b6814778925e9242cf5fd", "title": "Training Region-Based Object Detectors with Online Hard Example Mining", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780458"]}, {"id": "42764b57d0794b63487a295ce8c07eeb6961477e", "title": "Instance-Aware Semantic Segmentation via Multi-task Network Cascades", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780712"]}, {"id": "6a1b76f1ef876061ec479ab9bc13fcd517eb4188", "title": "Large Kernel Matters \u2014 Improve Semantic Segmentation by Global Convolutional Network", "year": "2017", "pdf": ["https://arxiv.org/pdf/1703.02719.pdf"], "doi": []}, {"id": "2c03df8b48bf3fa39054345bafabfeff15bfd11d", "title": "Deep Residual Learning for Image Recognition", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780459"]}, {"id": "24d66ec9dd202a6ea02b8723ae9d2fd7ffd32a4a", "title": "BING: Binarized Normed Gradients for Objectness Estimation at 300fps", "year": "2014", "pdf": ["http://ais.informatik.uni-freiburg.de/teaching/ws14/seminar_robotperception/papers/paper_01.pdf", "http://mmcheng.net/mftp/Papers/BingPoster.pdf", "http://mmcheng.net/mftp/Papers/ObjectnessBING.pdf", "http://orca-mwe.cf.ac.uk/115427/1/CvmBING.pdf", "http://www.cs.ucf.edu/courses/cap6412/spr2014/papers/BING-Binarized-Normed-Gradients-for-Objectness-Estimation-at-300fps.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2014/papers/Cheng_BING_Binarized_Normed_2014_CVPR_paper.pdf", "http://www.robots.ox.ac.uk/~vgg/rg/papers/14cvprObjectnessBING.pdf", "https://zimingzhang.files.wordpress.com/2014/10/14cvprobjectnessbing.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909816", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2014.414", "http://doi.org/10.1109/CVPR.2014.414"]}, {"id": "21d4258394a9c8f0ea15f0792d67f7e645720ff6", "title": "Multiscale Combinatorial Grouping", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909443"]}, {"id": "58a6eb3584b2f5df2f25d39a218904d510cae516", "title": "The UAVid Dataset for Video Semantic Segmentation", "year": "2018", "pdf": ["https://arxiv.org/pdf/1810.10438.pdf"], "doi": []}, {"id": "1779b6a17ee68afafb6801477b165f19901689b2", "title": "Object Contour Detection with a Fully Convolutional Encoder-Decoder Network", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780397"]}, {"id": "ab9d87a03ce3538ff42b6c26d87e676107cc392c", "title": "Looking Beyond the Image: Unsupervised Learning for Object Saliency and Detection", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619260"]}, {"id": "3cdb1364c3e66443e1c2182474d44b2fb01cd584", "title": "SegNet: A Deep Convolutional Encoder-Decoder Architecture for Image Segmentation", "year": "2017", "pdf": ["https://arxiv.org/pdf/1511.00561.pdf"], "doi": []}, {"id": "b92a1ed9622b8268ae3ac9090e25789fc41cc9b8", "title": "Pooling in image representation: The visual codeword point of view", "year": "2013", "pdf": ["http://cedric.cnam.fr/~thomen/papers/avila_CVIU2012_final.pdf", "http://webia.lip6.fr/~thomen/papers/avila_CVIU2012_accepted.pdf"], "doi": ["https://doi.org/10.1016/j.cviu.2012.09.007"]}, {"id": "3282ae3a0111d4ff1176c513a0c65e9351f045e4", "title": "Generating Object Segmentation Proposals Using Global and Local Search", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909706"]}, {"id": "db7d44d14d393d21a95d22c0d6132d9faa197b7d", "title": "Interactive comment on \u201c What effect does VOC sampling time have on derived OH reactivity ? \u201d by", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/cc59/6c392c1367be2f78600a092de090e086ecd2.pdf"], "doi": []}, {"id": "76d6a8b09432b4ae59d1e3606e1bf1ed0448e8ec", "title": "What effect does VOC sampling time have on derived OH 1 reactivity ? 2 3", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/fe78/29d0620f3173581b93c78d6310740812fa09.pdf"], "doi": []}, {"id": "09e15bb266da86d0a9525d2a94ac0b38f0b53b88", "title": "Detect What You Can: Detecting and Representing Objects Using Holistic Models and Body Parts", "year": "2014", "pdf": ["https://arxiv.org/pdf/1406.2031.pdf"], "doi": []}, {"id": "031055c241b92d66b6984643eb9e05fd605f24e2", "title": "Multi-fold MIL Training for Weakly Supervised Object Localization", "year": "2014", "pdf": ["http://www.cv-foundation.org/openaccess/content_cvpr_2014/papers/Cinbis_Multi-fold_MIL_Training_2014_CVPR_paper.pdf", "https://hal.inria.fr/hal-00975746/PDF/paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909705", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2014.309", "http://doi.org/10.1109/CVPR.2014.309"]}, {"id": "501d004186c1ebe7da5e3a0631624e0b55ebeabb", "title": "Learning Coupled Feature Spaces for Cross-Modal Matching", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751370"]}, {"id": "e1c17b0271c12033e78662d6d7ccb56ad321992c", "title": "Interactive comment on \u201c Impact of VOCs on the formation of ozone in a central China city during severe pollution periods \u201d by Bowei", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/e1c1/7b0271c12033e78662d6d7ccb56ad321992c.pdf"], "doi": []}, {"id": "aa4cc6506e837390486e5b836fb3dac8d15daafa", "title": "ThermalGAN: Multimodal Color-to-Thermal Image Translation for Person Re-identification in Multispectral Dataset", "year": "2018", "pdf": ["http://openaccess.thecvf.com/content_ECCVW_2018/papers/11134/Kniaz_ThermalGAN_Multimodal_Color-to-Thermal_Image_Translation_for_Person_Re-Identification_in_Multispectral_ECCVW_2018_paper.pdf"], "doi": ["https://doi.org/10.1007/978-3-030-11024-6_46"]}, {"id": "b0204e6c7301281ec8460e5251cd7c3c83c40883", "title": "Pano-RSOD: A Dataset and Benchmark for Panoramic Road Scene Object Detection", "year": "2019", "pdf": ["https://pdfs.semanticscholar.org/b020/4e6c7301281ec8460e5251cd7c3c83c40883.pdf"], "doi": []}, {"id": "522fab628aab972f39835521e31564b4b6c64fe5", "title": "Vehicle Classification on Low-resolution and Occluded images : A low-cost labeled dataset for augmentation", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/522f/ab628aab972f39835521e31564b4b6c64fe5.pdf"], "doi": []}, {"id": "79267f6c2df78cca735e0bf7ed27b9f9ff263224", "title": "Instance-sensitive Fully Convolutional Networks", "year": "2016", "pdf": ["https://arxiv.org/pdf/1603.08678.pdf"], "doi": []}, {"id": "2ec2f8cd6cf1a393acbc7881b8c81a78269cf5f7", "title": "Learning Image Embeddings using Convolutional Neural Networks for Improved Multi-Modal Semantics", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/2ec2/f8cd6cf1a393acbc7881b8c81a78269cf5f7.pdf"], "doi": []}, {"id": "851a884a89a95968c2edcad9787994ccaa8b51a8", "title": "BING: Binarized normed gradients for objectness estimation at 300fps", "year": "2018", "pdf": ["http://mmcheng.net/mftp/Papers/ObjectnessBING.pdf", "http://vision.ia.ac.cn/zh/senimar/reports/2014.5.6PPT.pdf"], "doi": ["https://doi.org/10.1007/s41095-018-0120-1"]}, {"id": "f78db8e59ba354258c3eb4fff2ec67564975436f", "title": "Improving Annotation for 3D Pose Dataset of Fine-Grained Object Categories", "year": "2018", "pdf": ["https://arxiv.org/pdf/1810.09263.pdf"], "doi": []}, {"id": "6de2b1058c5b717878cce4e7e50d3a372cc4aaa6", "title": "Generative Adversarial Nets", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/6de2/b1058c5b717878cce4e7e50d3a372cc4aaa6.pdf"], "doi": []}, {"id": "16fc1065c296840cb0f8ca62601aa17b7f0a02bf", "title": "Object Detection with Discriminatively Trained Part-Based Models", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/16fc/1065c296840cb0f8ca62601aa17b7f0a02bf.pdf"], "doi": []}, {"id": "1c0e8c3fb143eb5eb5af3026eae7257255fcf814", "title": "Weakly Supervised Deep Detection Networks", "year": "2016", "pdf": ["https://arxiv.org/pdf/1511.02853.pdf"], "doi": []}, {"id": "67490b6f34c827f107b046adeef0f5476132d4f8", "title": "How good are detection proposals, really?", "year": "2014", "pdf": ["https://arxiv.org/pdf/1406.6962.pdf"], "doi": []}, {"id": "00f8d6db6cf5c5e2a9df1604a09db06d8eb574dd", "title": "Geometric Mining: Scaling Geometric Hashing to Large Datasets", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7406484"]}, {"id": "33da83b54410af11d0cd18fd07c74e1a99f67e84", "title": "DeCAF: A Deep Convolutional Activation Feature for Generic Visual Recognition", "year": "2014", "pdf": ["https://arxiv.org/pdf/1310.1531.pdf"], "doi": []}, {"id": "428017f7a6df4d667275c7ac9b3feba39b70e4ae", "title": "CNN-RNN: A Unified Framework for Multi-label Image Classification", "year": "2016", "pdf": ["https://arxiv.org/pdf/1604.04573.pdf"], "doi": []}, {"id": "1cf29a0131211079fc73908ecf211ee78f090ad9", "title": "Regionlets for Generic Object Detection", "year": "2013", "pdf": ["http://image-net.org/challenges/LSVRC/2013/slides/ILSVRC2013_NEC.pdf", "http://users.eecs.northwestern.edu/~mya671/mypapers/ICCV13_Wang_Yang_Zhu_Lin.pdf", "http://vc.cs.nthu.edu.tw/home/paper/codfiles/melu/201510210855/regionlets.pdf", "http://web.missouri.edu/~hantx/ECE8001/Presentation_papers/Regionlets%20for%20Generic%20Object%20Detection.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2013/papers/Wang_Regionlets_for_Generic_2013_ICCV_paper.pdf", "http://www.ece.northwestern.edu/~mya671/mypapers/ICCV13_Wang_Yang_Zhu_Lin.pdf", "http://www.xiaoyumu.com/s//PDF/Regionlets.pdf", "http://www.xiaoyumu.com/s/PDF/Regionlets-pami.pdf", "http://www.xiaoyumu.com/s/slides/Regionlets_imagenet_web.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751111", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2013.10", "http://doi.org/10.1109/TPAMI.2015.2389830", "https://www.ncbi.nlm.nih.gov/pubmed/26353185", "https://www.wikidata.org/entity/Q50562532"]}, {"id": "08fe9658c086b842980e86c66bde3cef95bb6bec", "title": "Deformable part models are convolutional neural networks", "year": "2015", "pdf": ["https://arxiv.org/pdf/1409.5403.pdf"], "doi": []}, {"id": "6f9f143ec602aac743e07d092165b708fa8f1473", "title": "SegNet: A Deep Convolutional Encoder-Decoder Architecture for Robust Semantic Pixel-Wise Labelling", "year": "2015", "pdf": ["https://arxiv.org/pdf/1505.07293.pdf"], "doi": []}, {"id": "79cfb51a51fc093f66aac8e858afe2e14d4a1f20", "title": "Focal Loss for Dense Object Detection", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8237586"]}, {"id": "2640a376c2b51f83420526646613e85d730eab37", "title": "Saliency Detection via Graph-Based Manifold Ranking", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619251"]}, {"id": "3dd2f70f48588e9bb89f1e5eec7f0d8750dd920a", "title": "Fast R-CNN", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410526"]}, {"id": "c88c233c50f49b4b85a8702d5ee384d96fca8c23", "title": "Object-Proposal Evaluation Protocol is \u2018Gameable\u2019", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780466"]}, {"id": "2a94c84383ee3de5e6211d43d16e7de387f68878", "title": "Feature Pyramid Networks for Object Detection", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8099589"]}, {"id": "1f45b6d800108a277f4b2866420eefee3d2581e0", "title": "Deeply Learning the Messages in Message Passing Inference", "year": "2015", "pdf": ["https://arxiv.org/pdf/1506.02108.pdf"], "doi": []}, {"id": "35173e7bff5490a1701d02eda6f406a404111953", "title": "Deep Exemplar 2D-3D Detection by Adapting from Real to Rendered Views", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7781017"]}, {"id": "cdfe4e46d949b68c682e554c402d16679fd7247c", "title": "Stacked Deconvolutional Network for Semantic Segmentation", "year": "2017", "pdf": ["https://arxiv.org/pdf/1708.04943.pdf"], "doi": []}, {"id": "6641cbc41ad0b4660fa48036e38535a7b6174554", "title": "Weakly-Supervised Semantic Segmentation using Motion Cues", "year": "2016", "pdf": ["https://arxiv.org/pdf/1603.07188.pdf"], "doi": []}, {"id": "647c6ac5e0bfee0241d583650f18c6314f28aaee", "title": "Segmentation Driven Object Detection with Fisher Vectors", "year": "2013", "pdf": ["http://www.cv-foundation.org/openaccess/content_iccv_2013/papers/Cinbis_Segmentation_Driven_Object_2013_ICCV_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751480", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2013.369", "http://doi.org/10.1109/ICCV.2013.369"]}, {"id": "1cf25786f1e473fdbfcd817cfa37b0ad12806e72", "title": "Co-segmentation by Composition", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751271"]}, {"id": "272216c1f097706721096669d85b2843c23fa77d", "title": "Adam: A Method for Stochastic Optimization", "year": "2015", "pdf": ["https://arxiv.org/pdf/1412.6980.pdf"], "doi": []}, {"id": "2315fc6c2c0c4abd2443e26a26e7bb86df8e24cc", "title": "ImageNet Classification with Deep Convolutional Neural Networks", "year": "2012", "pdf": [], "doi": ["http://dl.acm.org/citation.cfm?id=3065386"]}, {"id": "b9c830332608afbbf452a20afeff38ca5aac2e27", "title": "Towards Computational Baby Learning: A Weakly-Supervised Approach for Object Detection", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410477"]}, {"id": "3671d0262c502e292fa8d2333ab50b3e827dbcee", "title": "Relaxed Multiple-Instance SVM with Application to Object Discovery", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410502"]}, {"id": "14b5e8ba23860f440ea83ed4770e662b2a111119", "title": "Visualizing and Understanding Convolutional Networks", "year": "2014", "pdf": ["https://arxiv.org/pdf/1311.2901.pdf"], "doi": []}, {"id": "3bde1aae1db3577938ffe910a9de5a1f187840e9", "title": "RIFD-CNN: Rotation-Invariant and Fisher Discriminative Convolutional Neural Networks for Object Detection", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780684"]}, {"id": "3d1053a1021a48538fd47c9689a81888d63ff37e", "title": "Parameter Learning and Convergent Inference for Dense Random Fields", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/f544/b3aeeb2b3690cb90bf568cfe92d864107c9f.pdf"], "doi": []}, {"id": "e257d1df3d9f979e37e97fe65f879a12703f80bd", "title": "Fast Image Classification by Boosting Fuzzy Classifiers", "year": "2016", "pdf": ["https://arxiv.org/pdf/1610.01068.pdf"], "doi": []}, {"id": "4c5a07ab1700a67afaf16fc9a7a2647f51358255", "title": "DeepSaliency: Multi-Task Deep Neural Network Model for Salient Object Detection", "year": "2016", "pdf": ["https://arxiv.org/pdf/1510.05484.pdf"], "doi": []}, {"id": "94c5ced03a6f896a4b3bc5a98b8b2baf349d8852", "title": "Fully Convolutional Instance-Aware Semantic Segmentation", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8099955"]}, {"id": "beac53e8074b4822943a3374ff5e9fed98a891b8", "title": "Generate to Adapt: Aligning Domains Using Generative Adversarial Networks", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578985"]}, {"id": "db14833dde228b911c7a1cbf025fdd78736eb520", "title": "Transfer Learning with Deep Convolutional Neural Network for SAR Target Classification with Limited Labeled Data", "year": "2017", "pdf": ["https://pdfs.semanticscholar.org/db14/833dde228b911c7a1cbf025fdd78736eb520.pdf"], "doi": []}, {"id": "c0a0adb7f02d5509969e6107c914f7cc6e9ec881", "title": "Semantic Instance Segmentation via Deep Metric Learning", "year": "2017", "pdf": ["https://arxiv.org/pdf/1703.10277.pdf"], "doi": []}, {"id": "59c2f171f95941b5e36fc56fcbc6fa4d66b5fb55", "title": "Unsupervised Learning of Visual Representations by Solving Jigsaw Puzzles", "year": "2016", "pdf": ["https://arxiv.org/pdf/1603.09246.pdf"], "doi": []}, {"id": "5c44807fb7a38d4c9c3ef3bdfb950b44c4a02a3f", "title": "Viewpoints and keypoints", "year": "2015", "pdf": ["https://arxiv.org/pdf/1411.6067.pdf"], "doi": []}, {"id": "0cf8443bcb14cfd6ac5bcf0e3775c0aad45558b4", "title": "CRAFT Objects from Images", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7781019"]}, {"id": "3964354a123009c071d493a521cfd0edf4396e66", "title": "Instance Segmentation of Indoor Scenes Using a Coverage Loss", "year": "2014", "pdf": ["http://cs.nyu.edu/~dsontag/papers/SilSonFer_ECCV14.pdf", "http://cs.nyu.edu/~fergus/papers/silbermaneccv2014.pdf", "http://vigir.missouri.edu/~gdesouza/Research/Conference_CDs/ECCV_2014/papers/8689/86890616.pdf"], "doi": ["https://doi.org/10.1007/978-3-319-10590-1_40"]}, {"id": "51ea36ff126f8b4546e46a8876b0a644659fc2f5", "title": "Higher Order Conditional Random Fields in Deep Neural Networks", "year": "2016", "pdf": ["https://arxiv.org/pdf/1511.08119.pdf"], "doi": []}, {"id": "faeda3ca4ff5cc11717147f85d6416f704143120", "title": "Exploring Invariances in Deep Convolutional Neural Networks Using Synthetic Images", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/d1f5/2a2daaa0421ae40dec1804ff32449175f19b.pdf"], "doi": []}, {"id": "28bc378a6b76142df8762cd3f80f737ca2b79208", "title": "Understanding Objects in Detail with Fine-Grained Attributes", "year": "2014", "pdf": ["http://people.cs.umass.edu/~smaji/papers/oid-cvpr14.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2014/papers/Vedaldi_Understanding_Objects_in_2014_CVPR_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909858", "http://doi.org/10.1109/CVPR.2014.463", "https://www.wikidata.org/entity/Q58050718"]}, {"id": "56466f99025c26a163c8f6a9d31955f090230809", "title": "STC: A Simple to Complex Framework for Weakly-Supervised Semantic Segmentation.", "year": "2017", "pdf": [], "doi": ["https://www.ncbi.nlm.nih.gov/pubmed/28114002", "https://doi.org/10.1109/TPAMI.2016.2636150"]}, {"id": "f0ee079a1f40736e5b7760b38781f090744f37fc", "title": "Contextualizing Object Detection and Classification", "year": "2015", "pdf": [], "doi": ["https://www.ncbi.nlm.nih.gov/pubmed/26353205", "https://doi.org/10.1109/TPAMI.2014.2343217", "https://www.wikidata.org/entity/Q40558547"]}, {"id": "27eca38a375af431430ca458ab3c723c59328634", "title": "ATLAS: A Three-Layered Approach to Facade Parsing", "year": "2015", "pdf": ["https://varcity.ethz.ch/paper/ijcv2015_mathias_atlas.pdf"], "doi": ["https://doi.org/10.1007/s11263-015-0868-z"]}, {"id": "a93d6e82cd500663a8eea02a8e3617632aafe913", "title": "Convolutional Neural Network-based Place Recognition", "year": "2014", "pdf": ["https://arxiv.org/pdf/1411.1509.pdf"], "doi": []}, {"id": "32248e2a2f103cfdfe7e6a944dc0e4373e95d7b8", "title": "Deep Fisher Kernels -- End to End Learning of the Fisher Kernel GMM Parameters", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909578"]}, {"id": "408e8eecc14c5cc60bbdfc486ba7a7fc97031788", "title": "Discriminative Unsupervised Feature Learning with Convolutional Neural Networks", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/408e/8eecc14c5cc60bbdfc486ba7a7fc97031788.pdf"], "doi": []}, {"id": "3fd90098551bf88c7509521adf1c0ba9b5dfeb57", "title": "Attribute-Based Classification for Zero-Shot Visual Object Categorization", "year": "2014", "pdf": ["http://pub.ist.ac.at/~chl/papers/lampert-pami2013.pdf", "https://staff.fnwi.uva.nl/t.e.j.mensink/zsl2016/zslpubs/lampert13pami.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6571196", "http://doi.org/10.1109/TPAMI.2013.140", "https://www.ncbi.nlm.nih.gov/pubmed/24457503", "https://www.wikidata.org/entity/Q38437353"]}, {"id": "15e024d8f5625ec03c8ac592fbc093687cfb5f02", "title": "The Visual Object Tracking VOT2015 Challenge Results", "year": "2015", "pdf": ["http://cell.missouri.edu/media/publications/Matej-KristanRengarajan_VOT2015-challenge-results_ICCVW-2015.pdf", "http://cmp.felk.cvut.cz/~vojirtom/publications/Kristan2013The.pdf", "http://data.votchallenge.net/vot2015/presentations/vot_2015_paper.pdf", "http://liris.cnrs.fr/Documents/Liris-6875.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015_workshops/w14/papers/Kristan_The_Visual_Object_ICCV_2015_paper.pdf", "http://www.epics-project.eu/publications/2013_kristan_iccvw.pdf", "http://www.epics-project.eu/publications/2014_kristan_iccvw.pdf", "https://hal.archives-ouvertes.fr/hal-01336773/file/Kristan2015The.pdf", "https://repositorio.uam.es/bitstream/handle/10486/674992/visual_kristan_ICCVW_2015_ps.pdf?isAllowed=y&sequence=1"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7406428", "http://doi.ieeecomputersociety.org/10.1109/ICCVW.2015.79", "http://doi.org/10.1109/ICCVW.2015.79", "https://hal.archives-ouvertes.fr/hal-01336773/document"]}, {"id": "a1bcdb820f6f0dde108996a18eefb239ef0e9566", "title": "Visual Tracking: An Experimental Survey.", "year": "2014", "pdf": [], "doi": ["https://www.ncbi.nlm.nih.gov/pubmed/26353314", "https://doi.org/10.1109/TPAMI.2013.230"]}, {"id": "1af794673d64112edf60f071ca24066e6a227d2b", "title": "Online Object Tracking: A Benchmark", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619156"]}, {"id": "d082f64b8a0a07d105207eb822be58ffb61b353a", "title": "EMOTIC: Emotions in Context Dataset", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_cvpr_2017_workshops/w41/papers/Lapedriza_EMOTIC_Emotions_in_CVPR_2017_paper.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8015019", "http://doi.ieeecomputersociety.org/10.1109/CVPRW.2017.285", "http://doi.org/10.1109/CVPRW.2017.285"]}, {"id": "2822a883d149956934a20614d6934c6ddaac6857", "title": "A survey of appearance models in visual object tracking", "year": "2013", "pdf": ["https://arxiv.org/pdf/1303.4803.pdf"], "doi": []}, {"id": "f727837e03a039d9bcec6d02cd87256f5a5854a4", "title": "Deep Convolutional Neural Networks for Computer-Aided Detection: CNN Architectures, Dataset Characteristics and Transfer Learning", "year": "2016", "pdf": ["https://arxiv.org/pdf/1602.03409.pdf"], "doi": []}, {"id": "ebe5a4c2dc3ca55a5aeedcd25a98ca6e446ce9cc", "title": "Hippocampal Activity Patterns Carry Information about Objects in Temporal Context", "year": "2014", "pdf": ["http://cogns.northwestern.edu/cbmg/pdfs/2.Hsieh_2014.pdf", "http://dml.ucdavis.edu/uploads/6/1/9/7/61974117/hseih_2014_hippocampal.pdf", "http://orca.cf.ac.uk/96034/7/Hsieh_NEURON-D-13-01629.1.pdf"], "doi": ["https://www.sciencedirect.com/science/article/pii/S0896627314000208", "https://doi.org/10.1016/j.neuron.2014.01.015", "https://www.ncbi.nlm.nih.gov/pubmed/24607234"]}, {"id": "b7d540cd0de72e984cdec44afa4a4d039cfd5eea", "title": "Object Tracking Benchmark", "year": "2015", "pdf": ["http://faculty.ucmerced.edu/mhyang/papers/pami15_tracking_benchmark.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7001050", "http://doi.org/10.1109/TPAMI.2014.2388226", "https://www.ncbi.nlm.nih.gov/pubmed/26353130", "https://www.wikidata.org/entity/Q35768210"]}, {"id": "149e5e5eeea5a9015ab5ae755f62c45ef70fa79b", "title": "Hierarchical Convolutional Features for Visual Tracking", "year": "2015", "pdf": ["http://faculty.ucmerced.edu/mhyang/papers/iccv15_tracking.pdf", "http://openaccess.thecvf.com/content_iccv_2015/papers/Ma_Hierarchical_Convolutional_Features_ICCV_2015_paper.pdf", "http://www.cv-foundation.org/openaccess/content_iccv_2015/papers/Ma_Hierarchical_Convolutional_Features_ICCV_2015_paper.pdf", "https://filebox.ece.vt.edu/~jbhuang/poster/ICCV_2015_HCF_Poster.pdf", "https://filebox.ece.vt.edu/~jbhuang/slides/ICCV_2015_HCF_Slides.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410709", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2015.352", "http://doi.org/10.1109/ICCV.2015.352"]}, {"id": "142f38642629b9d268999ad876af482177d36697", "title": "Improving Word Representations via Global Context and Multiple Word Prototypes", "year": "2012", "pdf": ["https://pdfs.semanticscholar.org/e3e9/b5257e02608794a1d0396b469869e6021d9c.pdf"], "doi": []}, {"id": "05375a7489f0a84d47a316bacb4d86e8a7bda0df", "title": "Analysis of Scores, Datasets, and Models in Visual Saliency Prediction", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751224"]}, {"id": "58e6eaacaab3fbf9b307a8aec1c614027ff501ce", "title": "Dynamic Eye Movement Datasets and Learnt Saliency Models for Visual Action Recognition", "year": "2012", "pdf": ["http://109.101.234.42/documente/publications/19-62.pdf", "http://sminchisescu.ins.uni-bonn.de/papers/ms12eccv.pdf", "http://web.cs.hacettepe.edu.tr/~erkut/bil722.f12/w09-levent.pdf"], "doi": ["https://doi.org/10.1007/978-3-642-33709-3_60"]}, {"id": "36c91b1342c1357877e89b4c43f8eadb39755c0b", "title": "Recognizing Human-Object Interactions in Still Images by Modeling the Mutual Context of Objects and Human Poses", "year": "2012", "pdf": ["http://cs.stanford.edu/groups/vision/documents/YaoFei-Fei_PAMI2012.pdf", "http://cs.stanford.edu/groups/vision/pdf/yaopami12.pdf", "http://vision.stanford.edu/pdf/yaopami12.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6165303", "http://doi.org/10.1109/TPAMI.2012.67", "https://www.ncbi.nlm.nih.gov/pubmed/22392710", "https://www.wikidata.org/entity/Q34185448"]}, {"id": "5b130e2a1fc3f71b7638cc5dde72481cf33264cc", "title": "Scene Recognition with CNNs: Objects, Scales and Dataset Bias", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780437"]}, {"id": "a2ca5733c08aa206337141f41e746ceb19953037", "title": "Task context impacts visual object processing differentially across the cortex.", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/a2ca/5733c08aa206337141f41e746ceb19953037.pdf"], "doi": []}, {"id": "0da75bded3ae15e255f5bd376960cfeffa173b4e", "title": "The Role of Context for Object Detection and Semantic Segmentation in the Wild", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909514"]}, {"id": "1883116d33a3e0321d2fe96e0a8a62546aca4ee9", "title": "Visual Question Answering: Datasets, Algorithms, and Future Challenges", "year": "2017", "pdf": ["https://arxiv.org/pdf/1610.01465.pdf"], "doi": []}, {"id": "88c307c51594c6d802080a0780d0d654e2e2891f", "title": "Visual Question Answering: A Survey of Methods and Datasets", "year": "2017", "pdf": ["https://arxiv.org/pdf/1607.05910.pdf"], "doi": []}, {"id": "3cfbb77e5a0e24772cfdb2eb3d4f35dead54b118", "title": "Don't count, predict! A systematic comparison of context-counting vs. context-predicting semantic vectors", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/2353/17b7ce64b4b3aefe57c1304e8157a4832d2c.pdf"], "doi": []}, {"id": "18e39b6f8f5c538d639bc0b46136ed93b5e3ef35", "title": "A Large Dataset of Object Scans", "year": "2016", "pdf": ["https://arxiv.org/pdf/1602.02481.pdf"], "doi": []}, {"id": "14b4127ef56f57eab19bb48d80ec169e7b1be944", "title": "Deep Reinforcement Learning for Visual Object Tracking in Videos", "year": "2017", "pdf": ["https://arxiv.org/pdf/1701.08936.pdf"], "doi": []}, {"id": "b31d6f201340ecec35bbe0f477710436f860605e", "title": "Learning Video Object Segmentation with Visual Memory", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8237742"]}, {"id": "0558c94a094158ecd64f0d5014d3d9668054fb97", "title": "Resilient Distributed Datasets: A Fault-Tolerant Abstraction for In-Memory Cluster Computing", "year": "2012", "pdf": ["https://pdfs.semanticscholar.org/528d/141aba97074977a332bb2d96364b716f246c.pdf"], "doi": []}, {"id": "09a503095db2d68b439e48d67481399198ed0e5b", "title": "Recurrent Models of Visual Attention", "year": "2014", "pdf": ["https://arxiv.org/pdf/1406.6247.pdf"], "doi": []}, {"id": "350d507f5d899e4d7293b1aa951aa0f81b9fd30a", "title": "The Visual Object Tracking VOT2017 Challenge Results", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_ICCV_2017_workshops/papers/w28/Kristan_The_Visual_Object_ICCV_2017_paper.pdf", "https://hal.archives-ouvertes.fr/hal-01336773/file/Kristan2015The.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8265440", "http://doi.ieeecomputersociety.org/10.1109/ICCVW.2017.230", "http://doi.org/10.1109/ICCVW.2017.230"]}, {"id": "a03c62d4206d4dd0ef4bf8312bfdb0d4971a1123", "title": "Modeling Visual Context Is Key to Augmenting Object Detection Datasets", "year": "2018", "pdf": ["https://arxiv.org/pdf/1807.07428.pdf"], "doi": []}, {"id": "7e232313a59d735ef7c8a9f4cc7bc980a29deb5e", "title": "Making the V in VQA Matter: Elevating the Role of Image Understanding in Visual Question Answering", "year": "2017", "pdf": [], "doi": ["https://doi.org/10.1007/s11263-018-1116-0"]}, {"id": "b4ee2a6b5fdf66f57e94a998cff2acef4af7d256", "title": "Monocular Visual Scene Understanding: Understanding Multi-Object Traffic Scenes", "year": "2013", "pdf": ["https://www.d2.mpi-inf.mpg.de/sites/default/files/wojek2013pami.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6265058", "http://doi.org/10.1109/TPAMI.2012.174", "https://www.ncbi.nlm.nih.gov/pubmed/22889818", "https://www.wikidata.org/entity/Q45823527"]}, {"id": "2ce63d77eecc35faef85a3b752a314c93a077ac9", "title": "Learning Multi-domain Convolutional Neural Networks for Visual Tracking", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780834"]}, {"id": "1c66fa1f3f189ca25bd657f53d77fde64c75f3da", "title": "Adaptive Color Attributes for Real-Time Visual Tracking", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909539"]}, {"id": "eb66303192a89c314ce4acae640ba700fa3293a3", "title": "Unsupervised Object Annotation through Context Analysis", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/eb66/303192a89c314ce4acae640ba700fa3293a3.pdf"], "doi": []}, {"id": "079ed21601974d0604544a6d816c2f51b5c039b8", "title": "Enriching Visual Knowledge Bases via Object Discovery and Segmentation", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909658"]}, {"id": "7574b7e5a75fdd338c27af5aeb77ab79460c4437", "title": "Learning Dynamic Siamese Network for Visual Object Tracking", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8237458"]}, {"id": "38a169b6e67ef7768f91fa208c9b5544f6f57f16", "title": "Object Bank: An Object-Level Image Representation for High-Level Visual Recognition", "year": "2013", "pdf": ["http://cs.stanford.edu/groups/vision/pdf/li_ijcv2013.pdf", "http://vision.stanford.edu/pdf/li_ijcv2013.pdf", "http://www.tpbin.com/Uploads/Subjects/79181d36-c45c-4f6c-821f-b7f9fcac3881.pdf"], "doi": ["http://doi.org/10.1007/s11263-013-0660-x"]}, {"id": "5527dd901b836e2f164c9fa3e62f57cd70c21745", "title": "3D object retrieval via range image queries in a bag-of-visual-words context", "year": "2013", "pdf": ["http://graphics.di.uoa.gr/Downloads/papers/journals/p43.pdf", "http://www.idi.ntnu.no/grupper/vis/wp-content/uploads/2013/09/Range3DRetrievalTVCfinal.pdf"], "doi": ["https://doi.org/10.1007/s00371-013-0876-3"]}, {"id": "5ea8a9ae2bf40c4722e618b732f769744ab57dfe", "title": "Context Driven Scene Parsing with Attention to Rare Classes", "year": "2014", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6909817"]}, {"id": "2d84f49572c2b29b6c9e1818eb57e7f12bc4236e", "title": "Query-Adaptive Asymmetrical Dissimilarities for Visual Object Retrieval", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6751322"]}, {"id": "00319cd17cebae5e1095a248260bd7be15781362", "title": "A Dataset for Improved RGBD-Based Object Detection and Pose Estimation for Warehouse Pick-and-Place", "year": "2016", "pdf": ["https://arxiv.org/pdf/1509.01277.pdf"], "doi": []}, {"id": "0f060f011fe3093a24bf2cde96a4a833f58ec5a5", "title": "Object-based visual query suggestion", "year": "2012", "pdf": ["https://www.researchgate.net/profile/Pierre_Letessier/publication/257627352_Object-based_visual_query_suggestion/links/00b7d5260034959679000000.pdf"], "doi": ["https://doi.org/10.1007/s11042-012-1340-5"]}, {"id": "33baa52f583fb049f473a53d8e0ca5ac8e7abbf2", "title": "Reinforcement Learning for Visual Object Detection", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780685"]}, {"id": "356223d76a850b7d312eec36c70e2f90d78086cc", "title": "Object Categorization Using Local Feature Context", "year": "2013", "pdf": ["http://www.nlpr.ia.ac.cn/2013papers/gjhy/gh75.pdf"], "doi": ["https://doi.org/10.1007/978-3-642-35728-2_31"]}, {"id": "1631bc8b8fe853278b8e54bd3e9fff1445fa9f91", "title": "Visual Distance Measures for Object Retrieval", "year": "2012", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6411668"]}, {"id": "df4f851e3c37017822a683b1356c6c390b5b5487", "title": "Image Question Answering: A Visual Semantic Embedding Model and a New Dataset", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/df4f/851e3c37017822a683b1356c6c390b5b5487.pdf"], "doi": []}, {"id": "4a8e9e179b58d3e10448f5e4680b66f34c8bc573", "title": "Learning to segment moving objects in videos", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7299035"]}, {"id": "0f6a8e9139cdd15fd0a8a292204aed21a8b51c5a", "title": "ReferItGame: Referring to Objects in Photographs of Natural Scenes", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/0f6a/8e9139cdd15fd0a8a292204aed21a8b51c5a.pdf"], "doi": []}, {"id": "1ced31e02234bc3d1092ffb2c7442ffbd51cb309", "title": "A Large Dataset to Train Convolutional Networks for Disparity, Optical Flow, and Scene Flow Estimation", "year": "2016", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7780807"]}, {"id": "5ac18d505ed6d10e8692cbb7d33f6852e6782692", "title": "The Open Images Dataset V4: Unified image classification, object detection, and visual relationship detection at scale", "year": "2018", "pdf": ["https://arxiv.org/pdf/1811.00982.pdf"], "doi": []}, {"id": "efa08283656714911acff2d5022f26904e451113", "title": "Active Object Localization in Visual Situations", "year": "2016", "pdf": ["https://arxiv.org/pdf/1607.00548.pdf"], "doi": []}, {"id": "1f7127b9ae86d7fac305c6b824801e455e82f511", "title": "Visual relationship detection with object spatial distribution", "year": "2017", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8019448", "http://doi.ieeecomputersociety.org/10.1109/ICME.2017.8019448", "http://doi.org/10.1109/ICME.2017.8019448"]}, {"id": "051830b0ea58d1568f19ec3297e301d9789c9a76", "title": "Bringing Semantics into Focus Using Visual Abstraction", "year": "2013", "pdf": ["http://courses.cs.washington.edu/courses/cse590v/13au/cse590v_au13_wk5_abstract_scenes.pdf", "http://courses.cs.washington.edu/courses/cse590v/13au/cse590v_au13_wk5_abstract_scenes_rob.pdf", "http://vigir.missouri.edu/~gdesouza/Research/Conference_CDs/IEEE_CVPR2013/data/Papers/4989d009.pdf", "http://www.cv-foundation.org/openaccess/content_cvpr_2013/papers/Zitnick_Bringing_Semantics_into_2013_CVPR_paper.pdf", "https://filebox.ece.vt.edu/~parikh/Publications/ZitnickParikh_CVPR_2013_clipart.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619231", "http://doi.ieeecomputersociety.org/10.1109/CVPR.2013.387", "http://doi.org/10.1109/CVPR.2013.387"]}, {"id": "64c4019f1ea9b54b1848418ac53c4e2584dc62d4", "title": "ActionNet-VE Dataset: A Dataset for Describing Visual Events by Extending VIRAT Ground 2.0", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7433003"]}, {"id": "8113a6d723c6f6dd2ff9808cf745480f16abc3f9", "title": "Attentional Network for Visual Object Detection", "year": "2017", "pdf": ["https://arxiv.org/pdf/1702.01478.pdf"], "doi": []}, {"id": "9a8e61cc9a95efe9e35df4d4230c7b8a655b7392", "title": "Unsupervised Joint Object Discovery and Segmentation in Internet Images", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6619097"]}, {"id": "19d6b9725a59f4b624205829d5f03ac893ca1367", "title": "Long-Term Visual Object Tracking Benchmark", "year": "2017", "pdf": ["https://arxiv.org/pdf/1712.01358.pdf"], "doi": []}, {"id": "022027ce7475029f78fb3cdb758d947a8978ab5c", "title": "Invariant visual object recognition: biologically plausible approaches", "year": "2015", "pdf": ["http://wrap.warwick.ac.uk/77413/1/WRAP_422_2015_Article_658.pdf", "http://www.oxcns.org/papers/554%20Robinson%20Rolls%202015%20Invariant%20visual%20object%20recognition%20Biologically%20plausible%20models.pdf"], "doi": ["https://doi.org/10.1007/s00422-015-0658-2", "https://www.ncbi.nlm.nih.gov/pubmed/26335743", "https://www.wikidata.org/entity/Q43248757"]}, {"id": "e8e662e45e39249756d2b0090782434a5cf1f4aa", "title": "VegFru: A Domain-Specific Dataset for Fine-Grained Visual Categorization", "year": "2017", "pdf": ["http://openaccess.thecvf.com/content_ICCV_2017/papers/Hou_VegFru_A_Domain-Specific_ICCV_2017_paper.pdf", "http://openaccess.thecvf.com/content_ICCV_2017/supplemental/Hou_VegFru_A_Domain-Specific_ICCV_2017_supplemental.pdf"], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8237328", "http://doi.ieeecomputersociety.org/10.1109/ICCV.2017.66", "http://doi.org/10.1109/ICCV.2017.66"]}, {"id": "54c7c3909c7e1e827befdbe8d2595a3b196ba1b8", "title": "AVA: A Video Dataset of Spatio-Temporally Localized Atomic Visual Actions", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578731"]}, {"id": "ac6c28cd866bccbbca54da8b7bd5b2e0d5e9d0b4", "title": "Cross-Dataset Learning of Visual Concepts", "year": "2012", "pdf": ["https://hpi.de/fileadmin/user_upload/fachgebiete/meinel/Semantic-Technologies/paper/amr2012.pdf"], "doi": ["https://doi.org/10.1007/978-3-319-12093-5_4"]}, {"id": "bbe7f4217a9bd9c6d3826b5b62d59d183e729383", "title": "Discriminative Hough context model for object detection", "year": "2013", "pdf": [], "doi": ["https://doi.org/10.1007/s00371-013-0780-x"]}, {"id": "55ca9fe4ae98904bfe026d22dcf1420ff9c0dd86", "title": "Dataset for Visual Reasoning", "year": "2017", "pdf": [], "doi": []}, {"id": "20f9a09defe5b02b98c464ca6df36b3b6358f60b", "title": "The State-of-the-Art in Visual Object Tracking", "year": "2012", "pdf": ["https://pdfs.semanticscholar.org/cd46/4a309fa1736e1373f0bb06baf75e3d0abcac.pdf"], "doi": []}, {"id": "d86fabd4498c8feaed80ec342d254fb877fb92f5", "title": "Region-Object Relevance-Guided Visual Relationship Detection", "year": "2018", "pdf": ["https://pdfs.semanticscholar.org/d86f/abd4498c8feaed80ec342d254fb877fb92f5.pdf"], "doi": []}, {"id": "aa0dbfcc3cf172971cc5679c02add3f291c8f886", "title": "The dynamics of invariant object recognition in the human visual system.", "year": "2014", "pdf": ["https://pdfs.semanticscholar.org/aa0d/bfcc3cf172971cc5679c02add3f291c8f886.pdf"], "doi": []}, {"id": "4405b44b5597787c42abeca6d0b3172175557b7b", "title": "Object discovery in 3D scenes via shape analysis", "year": "2013", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=6630857"]}, {"id": "7df07834ddde670cd6c626025e0c769837e266ea", "title": "Visual Saliency Detection Based Object Recognition", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/7df0/7834ddde670cd6c626025e0c769837e266ea.pdf"], "doi": []}, {"id": "8da0771e47c32405c4877cedce3ff84ac7390646", "title": "A survey of datasets for visual tracking", "year": "2015", "pdf": ["http://www.isir.upmc.fr/files/2015ACLI3545.pdf"], "doi": ["https://doi.org/10.1007/s00138-015-0713-y", "http://hal.upmc.fr/hal-01217152/document"]}, {"id": "4a75c3441cef2069458fe61a01196c2c8b32ee92", "title": "Single-trial classification of EEG in a visual object task using ICA and machine learning", "year": "2014", "pdf": ["https://www.research.ed.ac.uk/portal/files/14632594/Stewart.JNeurosciMeth.228.2014.pdf"], "doi": ["https://www.sciencedirect.com/science/article/pii/S0165027014000752", "https://doi.org/10.1016/j.jneumeth.2014.02.014", "https://www.ncbi.nlm.nih.gov/pubmed/24613798"]}, {"id": "1456f147381bf7c385225d854c2fb48c19eca285", "title": "LCAV-31: a dataset for light field object recognition", "year": "2014", "pdf": ["http://infoscience.epfl.ch/record/197737/files/902014.pdf"], "doi": ["http://doi.org/10.1117/12.2041097"]}, {"id": "2f17f59c2e3b71ff8d35677b7c0d0949a3f804a8", "title": "The Role of Context Selection in Object Detection", "year": "2016", "pdf": ["https://arxiv.org/pdf/1609.02948.pdf"], "doi": []}, {"id": "03dbc94b54c85cc34815df629fb508c6729e6eab", "title": "LSUN: Construction of a Large-scale Image Dataset using Deep Learning with Humans in the Loop", "year": "2015", "pdf": ["https://arxiv.org/pdf/1506.03365.pdf"], "doi": []}, {"id": "d7ed761cfe1b71aa7e4d08c355fcab131558f8c8", "title": "Learning Object Models on a Robot using Visual Context and Appearance Cues", "year": "2013", "pdf": ["https://pdfs.semanticscholar.org/d7ed/761cfe1b71aa7e4d08c355fcab131558f8c8.pdf"], "doi": []}, {"id": "d53c79cce46820642f2d4e0f0dac9b31d1201f24", "title": "Visual object trapping", "year": "2016", "pdf": [], "doi": ["https://doi.org/10.1016/j.cviu.2016.07.007"]}, {"id": "06064cddc8c3d0f270e09007dbeb27ff320d5e0d", "title": "Similarity-Based Fusion of MEG and fMRI Reveals Spatio-Temporal Dynamics in Human Cortex During Visual Object Recognition", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/7133/189b3532d268d581566b5730148fe9296a8d.pdf"], "doi": []}, {"id": "5ffd74d2873b7cba2cbc5fd295cc7fbdedca22a2", "title": "The Cityscapes Dataset", "year": "2015", "pdf": [], "doi": []}, {"id": "14ca963b4e0b87fc7213b8e3a3e2371cee7ffad6", "title": "Exploring Causal Relationships in Visual Object Tracking", "year": "2015", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7410708"]}, {"id": "f9c602cc436a9ea2f9e7db48c77d924e09ce3c32", "title": "Fashion-MNIST: a Novel Image Dataset for Benchmarking Machine Learning Algorithms", "year": "2017", "pdf": ["https://arxiv.org/pdf/1708.07747.pdf"], "doi": []}, {"id": "3ecb007d46614d5e5566b0ad7c96c0c4c8ac0d14", "title": "Enhancing Object Recognition With Dynamic Cognitive Context", "year": "2016", "pdf": ["https://pdfs.semanticscholar.org/3ecb/007d46614d5e5566b0ad7c96c0c4c8ac0d14.pdf"], "doi": []}, {"id": "c8018f3dc6121d92da37f1756e7bd11a128aa55c", "title": "Region Filling and Object Removal by Exemplar based Image Inpainting", "year": "2015", "pdf": ["https://pdfs.semanticscholar.org/c801/8f3dc6121d92da37f1756e7bd11a128aa55c.pdf"], "doi": []}, {"id": "051d8bbf12877c46ae9a598a386c5b72d1b103ac", "title": "Object Detection using Geometrical Context Feedback", "year": "2012", "pdf": ["http://cvgl.stanford.edu/papers/Sun_IJCV_2012.pdf"], "doi": ["http://doi.org/10.1007/s11263-012-0547-2"]}, {"id": "b0cd469a06fb2eae3a5cc0c860aa592f71b13f6d", "title": "IQA: Visual Question Answering in Interactive Environments", "year": "2018", "pdf": [], "doi": ["http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=8578528"]}]}