diff options
Diffstat (limited to 'site/content/pages/datasets')
41 files changed, 147 insertions, 70 deletions
diff --git a/site/content/pages/datasets/50_people_one_question/assets/background.gif b/site/content/pages/datasets/50_people_one_question/assets/background.gif Binary files differnew file mode 100644 index 00000000..a0539bbb --- /dev/null +++ b/site/content/pages/datasets/50_people_one_question/assets/background.gif diff --git a/site/content/pages/datasets/50_people_one_question/assets/background.jpg b/site/content/pages/datasets/50_people_one_question/assets/background.jpg Binary files differnew file mode 100644 index 00000000..f7567314 --- /dev/null +++ b/site/content/pages/datasets/50_people_one_question/assets/background.jpg diff --git a/site/content/pages/datasets/50_people_one_question/assets/background_02.jpg b/site/content/pages/datasets/50_people_one_question/assets/background_02.jpg Binary files differnew file mode 100644 index 00000000..f20ee861 --- /dev/null +++ b/site/content/pages/datasets/50_people_one_question/assets/background_02.jpg diff --git a/site/content/pages/datasets/50_people_one_question/assets/index.jpg b/site/content/pages/datasets/50_people_one_question/assets/index.jpg Binary files differnew file mode 100644 index 00000000..7bf4ed1d --- /dev/null +++ b/site/content/pages/datasets/50_people_one_question/assets/index.jpg diff --git a/site/content/pages/datasets/50_people_one_question/assets/index_02.jpg b/site/content/pages/datasets/50_people_one_question/assets/index_02.jpg Binary files differnew file mode 100644 index 00000000..347bd08d --- /dev/null +++ b/site/content/pages/datasets/50_people_one_question/assets/index_02.jpg diff --git a/site/content/pages/datasets/brainwash/assets/background.jpg b/site/content/pages/datasets/brainwash/assets/background.jpg Binary files differnew file mode 100644 index 00000000..eada1779 --- /dev/null +++ b/site/content/pages/datasets/brainwash/assets/background.jpg diff --git a/site/content/pages/datasets/brainwash/assets/index.jpg b/site/content/pages/datasets/brainwash/assets/index.jpg Binary 
files differnew file mode 100644 index 00000000..c903baea --- /dev/null +++ b/site/content/pages/datasets/brainwash/assets/index.jpg diff --git a/site/content/pages/datasets/caltech_10k/index.md b/site/content/pages/datasets/caltech_10k/index.md new file mode 100644 index 00000000..8f49f2d1 --- /dev/null +++ b/site/content/pages/datasets/caltech_10k/index.md @@ -0,0 +1,29 @@ +------------ + +status: published +title: Caltech 10K Faces Dataset +desc: Caltech 10K Faces Dataset +slug: caltech_10k +published: 2019-2-23 +updated: 2019-2-23 +authors: Adam Harvey + +------------ + +# Caltech 10K Faces Dataset + ++ Years: TBD ++ Images: TBD ++ Identities: TBD ++ Origin: Google Search ++ Funding: TBD + +------- + +Ignore text below these lines + +------- + +Research + +The dataset contains images of people collected from the web by typing common given names into Google Image Search. The coordinates of the eyes, the nose and the center of the mouth for each frontal face are provided in a ground truth file. This information can be used to align and crop the human faces or as a ground truth for a face detection algorithm. The dataset has 10,524 human faces of various resolutions and in different settings, e.g. portrait images, groups of people, etc. Profile faces or very low resolution faces are not labeled.
\ No newline at end of file diff --git a/site/content/pages/datasets/duke_mtmc/assets/background.jpg b/site/content/pages/datasets/duke_mtmc/assets/background.jpg Binary files differnew file mode 100644 index 00000000..fb76d97f --- /dev/null +++ b/site/content/pages/datasets/duke_mtmc/assets/background.jpg diff --git a/site/content/pages/datasets/duke_mtmc/assets/index.jpg b/site/content/pages/datasets/duke_mtmc/assets/index.jpg Binary files differnew file mode 100644 index 00000000..89b7b08d --- /dev/null +++ b/site/content/pages/datasets/duke_mtmc/assets/index.jpg diff --git a/site/content/pages/datasets/facebook/index.md b/site/content/pages/datasets/facebook/index.md new file mode 100644 index 00000000..6e3857fd --- /dev/null +++ b/site/content/pages/datasets/facebook/index.md @@ -0,0 +1,32 @@ +------------ + +status: published +title: Facebook +desc: TBD +subdesc: TBD +image: assets/background.jpg +caption: TBD +slug: facebook +published: 2019-2-23 +updated: 2019-2-23 +color: #aaaaff +authors: Adam Harvey + +------------ + +### Statistics + ++ Years: 2002-2004 ++ Images: 13,233 ++ Identities: 5,749 ++ Origin: Yahoo News Images ++ Funding: (Possibly, partially CIA) + +---- + +Ignore content below these lines + +--- + + +- Tool to create face datasets from Facebook <https://github.com/ankitaggarwal011/FaceGrab> diff --git a/site/content/pages/datasets/helen/assets/background.jpg b/site/content/pages/datasets/helen/assets/background.jpg Binary files differnew file mode 100644 index 00000000..63ebb8c9 --- /dev/null +++ b/site/content/pages/datasets/helen/assets/background.jpg diff --git a/site/content/pages/datasets/helen/assets/index.jpg b/site/content/pages/datasets/helen/assets/index.jpg Binary files differnew file mode 100644 index 00000000..9e62679b --- /dev/null +++ b/site/content/pages/datasets/helen/assets/index.jpg diff --git a/site/content/pages/datasets/hrt_transgender/assets/background.jpg 
b/site/content/pages/datasets/hrt_transgender/assets/background.jpg Binary files differnew file mode 100644 index 00000000..9437c4ff --- /dev/null +++ b/site/content/pages/datasets/hrt_transgender/assets/background.jpg diff --git a/site/content/pages/datasets/hrt_transgender/assets/index.jpg b/site/content/pages/datasets/hrt_transgender/assets/index.jpg Binary files differnew file mode 100644 index 00000000..428ac42a --- /dev/null +++ b/site/content/pages/datasets/hrt_transgender/assets/index.jpg diff --git a/site/content/pages/datasets/ilids_vid/assets/background.jpg b/site/content/pages/datasets/ilids_vid/assets/background.jpg Binary files differnew file mode 100644 index 00000000..6acd30e8 --- /dev/null +++ b/site/content/pages/datasets/ilids_vid/assets/background.jpg diff --git a/site/content/pages/datasets/ilids_vid/assets/index.jpg b/site/content/pages/datasets/ilids_vid/assets/index.jpg Binary files differnew file mode 100644 index 00000000..66c80d7d --- /dev/null +++ b/site/content/pages/datasets/ilids_vid/assets/index.jpg diff --git a/site/content/pages/datasets/index.md b/site/content/pages/datasets/index.md new file mode 100644 index 00000000..fa012758 --- /dev/null +++ b/site/content/pages/datasets/index.md @@ -0,0 +1,22 @@ +------------ + +status: published +title: MegaPixels: Datasets +desc: Facial Recognition Datasets +slug: home +published: 2018-12-15 +updated: 2018-12-15 +authors: Adam Harvey +sync: false + +------------ + +# Facial Recognition Datasets + ++ Found: 275 datasets ++ Created between: 1993-2018 ++ Smallest dataset: 20 images ++ Largest dataset: 10,000,000 images + ++ Highest resolution faces: 450x500 (Unconstrained College Students) ++ Lowest resolution faces: 16x20 pixels (QMUL SurvFace) diff --git a/site/content/pages/datasets/lfw/assets/background.jpg b/site/content/pages/datasets/lfw/assets/background.jpg Binary files differnew file mode 100644 index 00000000..3ab1607d --- /dev/null +++ 
b/site/content/pages/datasets/lfw/assets/background.jpg diff --git a/site/content/pages/datasets/lfw/assets/index.jpg b/site/content/pages/datasets/lfw/assets/index.jpg Binary files differnew file mode 100644 index 00000000..bc36c106 --- /dev/null +++ b/site/content/pages/datasets/lfw/assets/index.jpg diff --git a/site/content/pages/datasets/lfw/assets/lfw_commercial_use.csv b/site/content/pages/datasets/lfw/assets/lfw_commercial_use.csv index 70e2fdeb..a2a4b39c 100644 --- a/site/content/pages/datasets/lfw/assets/lfw_commercial_use.csv +++ b/site/content/pages/datasets/lfw/assets/lfw_commercial_use.csv @@ -1,44 +1,44 @@ "name_display","company_url","example_url","country","description" -"Aratek","http://www.aratek.co/","","China","Biometric sensors for telecom, civil identification, finance, education, POS, and transportation" -"Asaphus","https://asaphus.de/","","Germany","Face recognition for home appliances and autonomous vehicles interaction" -"Aureus","https://cyberextruder.com/biometric-face-recognition-software-use-cases/","","USA","Retail loss prevention solutions, biometric access control, law enforcement and safe city applications, gaming and hospitality applications" +"Aratek","http://www.aratek.co/"," ","China","Biometric sensors for telecom, civil identification, finance, education, POS, and transportation" +"Asaphus","https://asaphus.de/"," ","Germany","Face recognition for home appliances and autonomous vehicles interaction" +"Aureus","https://cyberextruder.com/biometric-face-recognition-software-use-cases/"," ","USA","Retail loss prevention solutions, biometric access control, law enforcement and safe city applications, gaming and hospitality applications" "Baidu","http://research.baidu.com/institute-of-deep-learning/","https://www.newscientist.com/article/2113176-chinese-tourist-town-uses-face-recognition-as-an-entry-pass/","China","Retail payment, transportation, civil identification" -"Betaface","https://www.betaface.com/","","Germany","Web 
advertising and entertainment, video surveillance, security software, b2b software" -"Yi+AI","http://www.dress-plus.com/solution","","China","Scenario-based advertising, real-time personalized recommendation, character recognition for ads placement" -"CM-CV&AR","http://www.cloudminds.com/","","USA","Human augmented robot intelligence" -"Samtech","http://samtechinfonet.com/products_frs.php","","India","Facilities management, infrastructure support" -"ColorReco","http://www.colorreco.com/","","China","Face login verification, online payment security verification, access control system identity authentication and face recognition lock, mobile payment, driver fatigue recognition, virtual makeup" +"Betaface","https://www.betaface.com/"," ","Germany","Web advertising and entertainment, video surveillance, security software, b2b software" +"Yi+AI","http://www.dress-plus.com/solution"," ","China","Scenario-based advertising, real-time personalized recommendation, character recognition for ads placement" +"CM-CV&AR","http://www.cloudminds.com/"," ","USA","Human augmented robot intelligence" +"Samtech","http://samtechinfonet.com/products_frs.php"," ","India","Facilities management, infrastructure support" +"ColorReco","http://www.colorreco.com/"," ","China","Face login verification, online payment security verification, access control system identity authentication and face recognition lock, mobile payment, driver fatigue recognition, virtual makeup" "CloudWalk","www.cloudwalk.cn/","https://qz.com/africa/1287675/china-is-exporting-facial-recognition-to-africa-ensuring-ai-dominance-through-diversity/","China","Security and law enforcement. 
Being deployed in Zimbabwe" -"Cylltech","http://www.cylltech.com.cn/","","China","Conference management, social assistance, civil access, media orientation, precision marketing, scenic intelligence, tourism management" +"Cylltech","http://www.cylltech.com.cn/"," ","China","Conference management, social assistance, civil access, media orientation, precision marketing, scenic intelligence, tourism management" "Dahua-FaceImage","https://www.dahuasecurity.com/","https://www.dahuasecurity.com/solutions/solutionsbyapplication/23","China","Public security, public access control, finance" -"Daream","http://www.daream.com","","China","Fatigue and distraction detection for autonomous vehicles" -"Deepmark","https://deepmark.ru/","","Russia","Workplace access control" -"Easen Electron","http://www.easen-electron.com","","China","Face recognition door locks for automobiles" -"Ever AI","https://ever.ai/","","USA","Law enforcement, smart cities, surveillance, building security, retail, payments, autonomous vehicles, grocery stores, enhanced marketing" -"Facebook (Face.com)","https://en.wikipedia.org/wiki/Face.com","","USA","Sold to facebook in 2012, and now incorporated into DeepFace" -"Face++","https://www.faceplusplus.com/","","China","Audience engagement analysis, interactive marketing, gaming, photo album processing, security for mobile payments" -"Faceall","http://www.faceall.cn/index.en.html","","China","Internet banking, insurance, automated surveillance, access control, photo refinement, avatar creation" -"Faceter","https://faceter.io","","USA","Workforce attendence reporting and analytics, home video surveillance, retail customer behavior, GPU mining compatible" -"Facevisa","http://www.facevisa.com","","China","Face detection, face key point positioning, living body certification, facial attribute analysis" -"Fujitsu R&D","https://www.fujitsu.com/cn/en/about/local/subsidiaries/frdc/","","Japan","Consumer cameras" -"SenseTime","https://www.sensetime.com/","","Hong 
Kong","Surveillance, access control, image retrieval, and automatic log-on for personal computer or mobile devices" +"Daream","http://www.daream.com"," ","China","Fatigue and distraction detection for autonomous vehicles" +"Deepmark","https://deepmark.ru/"," ","Russia","Workplace access control" +"Easen Electron","http://www.easen-electron.com"," ","China","Face recognition door locks for automobiles" +"Ever AI","https://ever.ai/"," ","USA","Law enforcement, smart cities, surveillance, building security, retail, payments, autonomous vehicles, grocery stores, enhanced marketing" +"Facebook (Face.com)","https://en.wikipedia.org/wiki/Face.com"," ","USA","Sold to facebook in 2012, and now incorporated into DeepFace" +"Face++","https://www.faceplusplus.com/"," ","China","Audience engagement analysis, interactive marketing, gaming, photo album processing, security for mobile payments" +"Faceall","http://www.faceall.cn/index.en.html"," ","China","Internet banking, insurance, automated surveillance, access control, photo refinement, avatar creation" +"Faceter","https://faceter.io"," ","USA","Workforce attendence reporting and analytics, home video surveillance, retail customer behavior, GPU mining compatible" +"Facevisa","http://www.facevisa.com"," ","China","Face detection, face key point positioning, living body certification, facial attribute analysis" +"Fujitsu R&D","https://www.fujitsu.com/cn/en/about/local/subsidiaries/frdc/"," ","Japan","Consumer cameras" +"SenseTime","https://www.sensetime.com/"," ","Hong Kong","Surveillance, access control, image retrieval, and automatic log-on for personal computer or mobile devices" "Turing Robot","http://www.tuling123.com/","http://biz.turingos.cn/home","China","Emotion recognition and analysis for robots and toys, chatbots and digital assistants" "NEC","https://www.nec.com/en/press/201407/global_20140716_01.html","https://arxiv.org/abs/1212.6094","Japan","Law enforcement, event crowd monitoring, used specificallfy by 
Metropolitan police in UK" -"Aurora","http://auroracs.co.uk/","","UK","Face recognition in airports for security, queue management, x-ray divestment tray linkage" +"Aurora","http://auroracs.co.uk/"," ","UK","Face recognition in airports for security, queue management, x-ray divestment tray linkage" "VisionLabs","https://visionlabs.ai/","https://venturebeat.com/2016/07/07/russian-facial-recognition-startup-visionlabs-raises-5-5m-after-partnering-with-facebook-and-google/","Russia","Video surveillance, banking and finance, customer authentication for retail" -"Yunshitu","http://yunshitu.cn","","China","Security, Internet, broadcasting and other industries" -"Glasssix","http://www.glasssix.com/","","China","School attendance, workforce monitoring" +"Yunshitu","http://yunshitu.cn"," ","China","Security, Internet, broadcasting and other industries" +"Glasssix","http://www.glasssix.com/"," ","China","School attendance, workforce monitoring" "Hisign","http://www.hisign.com.cn/en-us/index.aspx","https://www.bloomberg.com/research/stocks/private/snapshot.asp?privcapId=52323181","China","Criminal investigation information application, and financial big data risk prevention and control products in China" "icarevision","http://www.icarevision.cn","https://www.bloomberg.com/research/stocks/private/snapshot.asp?privcapId=306707800","China","Video surveillance" "IntelliVision","https://www.intelli-vision.com/facial-recognition/","https://www.bloomberg.com/profiles/companies/0080393D:US-intellivision-technologies-corp","USA","Smart homes and buildings, smart security, smart city, smart retail, Smart auto" "Meiya Pico","https://meiyapico.com/","https://www.bloomberg.com/research/stocks/private/snapshot.asp?privcapId=117577345","China","Digital forensics and information security products and services in China" "Orion 
Star","https://www.ainirobot.com/#sixthPage","https://www.prnewswire.com/news-releases/orionstar-wins-challenge-to-recognize-one-million-celebrity-faces-with-artificial-intelligence-300494265.html","China","Face recognition for robots and livestream video censoring" -"Pegatron","http://www.pegatroncorp.com","","China","Workforce attendance" +"Pegatron","http://www.pegatroncorp.com"," ","China","Workforce attendance" "PingAn AI Lab","http://www.pingan.com/","https://www.biometricupdate.com/201703/ping-an-technology-developing-ai-face-recognition-technology-with-record-results","China","Financial services, lending" -"ReadSense","http://www.readsense.ai/","","China","Access control, traffic analysis, crowd analysis, head counting, drone vision, home appliances, community surveillance, custom attention analysis" -"sensingtech","www.sensingtech.com.cn","","China","Workplace entrypoint authentication" -"TCIT","http://www.tcit-us.com/?p=4023","","Taiwan","Retail analytics, workplace access control" -"TerminAI","terminai.com","","China","Smart office, smart city, smart gym, smart medical, smart community" -"Uni-Ubi","http://uni-ubi.com/","","China","Facial recognition for education, business, community, construction" -"Tencent YouTu Lab","http://bestimage.qq.com/","","China","Consumer applications for automatic facial beauty" -"Yuntu WiseSight","http://www.facelab.cn/","","China","Intrusion alarm, access control, access control, electronic patrol, and network alarm. detect suspicious personnel, real-name authentication, and public security, customs, airports, railways and other government security agencies, electronic patrol"
\ No newline at end of file +"ReadSense","http://www.readsense.ai/"," ","China","Access control, traffic analysis, crowd analysis, head counting, drone vision, home appliances, community surveillance, custom attention analysis" +"sensingtech","www.sensingtech.com.cn"," ","China","Workplace entrypoint authentication" +"TCIT","http://www.tcit-us.com/?p=4023"," ","Taiwan","Retail analytics, workplace access control" +"TerminAI","terminai.com"," ","China","Smart office, smart city, smart gym, smart medical, smart community" +"Uni-Ubi","http://uni-ubi.com/"," ","China","Facial recognition for education, business, community, construction" +"Tencent YouTu Lab","http://bestimage.qq.com/"," ","China","Consumer applications for automatic facial beauty" +"Yuntu WiseSight","http://www.facelab.cn/"," ","China","Intrusion alarm, access control, access control, electronic patrol, and network alarm. detect suspicious personnel, real-name authentication, and public security, customs, airports, railways and other government security agencies, electronic patrol"
\ No newline at end of file diff --git a/site/content/pages/datasets/lfw/assets/lfw_index.gif b/site/content/pages/datasets/lfw/assets/lfw_index.gif Binary files differdeleted file mode 100644 index 63a5c423..00000000 --- a/site/content/pages/datasets/lfw/assets/lfw_index.gif +++ /dev/null diff --git a/site/content/pages/datasets/lfw/assets/lfw_montage.jpg b/site/content/pages/datasets/lfw/assets/lfw_montage.jpg Binary files differdeleted file mode 100644 index 8d73c417..00000000 --- a/site/content/pages/datasets/lfw/assets/lfw_montage.jpg +++ /dev/null diff --git a/site/content/pages/datasets/lfw/assets/lfw_synthetic.jpg b/site/content/pages/datasets/lfw/assets/lfw_synthetic.jpg Binary files differdeleted file mode 100644 index c2a34043..00000000 --- a/site/content/pages/datasets/lfw/assets/lfw_synthetic.jpg +++ /dev/null diff --git a/site/content/pages/datasets/lfw/index.md b/site/content/pages/datasets/lfw/index.md index 1f847a2a..4161561d 100644 --- a/site/content/pages/datasets/lfw/index.md +++ b/site/content/pages/datasets/lfw/index.md @@ -2,60 +2,64 @@ status: published title: Labeled Faces in The Wild -desc: LFW: Labeled Faces in The Wild +desc: Labeled Faces in The Wild (LFW) is a database of face photographs designed for studying the problem of unconstrained face recognition. +subdesc: It includes 13,233 images of 5,749 people copied from the Internet during 2002-2004. +image: assets/background.jpg +caption: A few of the 5,749 people in the Labeled Faces in the Wild Dataset. The most widely used face dataset for benchmarking commercial face recognition algorithms. 
slug: lfw published: 2019-2-23 updated: 2019-2-23 +color: #ff0000 authors: Adam Harvey ------------ -# LFW +### Statistics + Years: 2002-2004 + Images: 13,233 + Identities: 5,749 + Origin: Yahoo News Images -+ Funding: (Possibly, partially CIA*) ++ Funding: (Possibly, partially CIA) - - -*Labeled Faces in The Wild* (LFW) is "a database of face photographs designed for studying the problem of unconstrained face recognition[^lfw_www]. It is used to evaluate and improve the performance of facial recognition algorithms in academic, commercial, and government research. According to BiometricUpdate.com[^lfw_pingan], LFW is "the most widely used evaluation set in the field of facial recognition, LFW attracts a few dozen teams from around the globe including Google, Facebook, Microsoft Research Asia, Baidu, Tencent, SenseTime, Face++ and Chinese University of Hong Kong." - -The LFW dataset includes 13,233 images of 5,749 people that were collected between 2002-2004. LFW is a subset of *Names of Faces* and is part of the first facial recognition training dataset created entirely from images appearing on the Internet. The people appearing in LFW are... - -The *Names and Faces* dataset was the first face recognition dataset created entire from online photos. However, *Names and Faces* and *LFW* are not the first face recognition dataset created entirely "in the wild". That title belongs to the [UCD dataset](/datasets/ucd_faces/). Images obtained "in the wild" means using an image without explicit consent or awareness from the subject or photographer. - - -### Analysis +### INSIGHTS - There are about 3 men for every 1 woman (4,277 men and 1,472 women) in the LFW dataset[^lfw_www] - The person with the most images is [George W. Bush](http://vis-www.cs.umass.edu/lfw/person/George_W_Bush_comp.html) with 530 - There are about 3 George W. 
Bush's for every 1 [Tony Blair](http://vis-www.cs.umass.edu/lfw/person/Tony_Blair.html) -- 70% of people in the dataset have only 1 image and 29% have 2 or more images - The LFW dataset includes over 500 actors, 30 models, 10 presidents, 124 basketball players, 24 football players, 11 kings, 7 queens, and 1 [Moby](http://vis-www.cs.umass.edu/lfw/person/Moby.html) - In all 3 of the LFW publications [^lfw_original_paper], [^lfw_survey], [^lfw_tech_report] the words "ethics", "consent", and "privacy" appear 0 times - The word "future" appears 71 times -### Synthetic Faces +## Labeled Faces in the Wild -To visualize the types of photos in the dataset without explicitly publishing individual's identities a generative adversarial network (GAN) was trained on the entire dataset. The images in this video show a neural network learning the visual latent space and then interpolating between archetypical identities within the LFW dataset. +*Labeled Faces in The Wild* (LFW) is "a database of face photographs designed for studying the problem of unconstrained face recognition"[^lfw_www]. It is used to evaluate and improve the performance of facial recognition algorithms in academic, commercial, and government research. According to BiometricUpdate.com[^lfw_pingan], LFW is "the most widely used evaluation set in the field of facial recognition, LFW attracts a few dozen teams from around the globe including Google, Facebook, Microsoft Research Asia, Baidu, Tencent, SenseTime, Face++ and Chinese University of Hong Kong." - +The LFW dataset includes 13,233 images of 5,749 people that were collected between 2002 and 2004. LFW is a subset of *Names and Faces* and is part of the first facial recognition training dataset created entirely from images appearing on the Internet. The people appearing in LFW are... +The *Names and Faces* dataset was the first face recognition dataset created entirely from online photos. 
However, *Names and Faces* and *LFW* are not the first face recognition datasets created entirely "in the wild". That title belongs to the [UCD dataset](/datasets/ucd_faces/). Obtaining images "in the wild" means using an image without explicit consent or awareness from the subject or photographer. ### Biometric Trade Routes -To understand how this dataset has been used, its citations have been geocoded to show an approximate geographic digital trade route of the biometric data. Lines indicate an organization (education, commercial, or governmental) that has cited the LFW dataset in their research. Data is compiled from [SemanticScholar](https://www.semanticscholar.org). +To understand how this dataset has been used, its citations have been geocoded to show an approximate geographic digital trade route of the biometric data. Lines indicate an organization (education, commercial, or governmental) that has cited the LFW dataset in their research. Data is compiled from [Semantic Scholar](https://www.semanticscholar.org). -[add map here] +``` +map +``` + +### Synthetic Faces + +To visualize the types of photos in the dataset without explicitly publishing individuals' identities, a generative adversarial network (GAN) was trained on the entire dataset. The images in this video show a neural network learning the visual latent space and then interpolating between archetypical identities within the LFW dataset. + + ### Citations Browse or download the geocoded citation data collected for the LFW dataset. -[add citations table here] - +``` +citations +``` ### Additional Information @@ -67,27 +71,14 @@ Browse or download the geocoded citation data collected for the LFW dataset. 
- The faces in the LFW dataset were detected using the Viola-Jones haarcascade face detector [^lfw_website] [^lfw-survey] - The LFW dataset is used by several of the largest tech companies in the world including "Google, Facebook, Microsoft Research Asia, Baidu, Tencent, SenseTime, Face++ and Chinese University of Hong Kong." [^lfw_pingan] - All images in the LFW dataset were copied from Yahoo News between 2002 - 2004 -<<<<<<< HEAD -- In 2014, two of the four original authors of the LFW dataset received funding from IARPA and ODNI for their follow up paper [Labeled Faces in the Wild: Updates and New Reporting Procedures](https://www.semanticscholar.org/paper/Labeled-Faces-in-the-Wild-%3A-Updates-and-New-Huang-Learned-Miller/2d3482dcff69c7417c7b933f22de606a0e8e42d4) via IARPA contract number 2014-14071600010 +- In 2014, two of the four original authors of the LFW dataset received funding from IARPA and ODNI for their followup paper [Labeled Faces in the Wild: Updates and New Reporting Procedures](https://www.semanticscholar.org/paper/Labeled-Faces-in-the-Wild-%3A-Updates-and-New-Huang-Learned-Miller/2d3482dcff69c7417c7b933f22de606a0e8e42d4) via IARPA contract number 2014-14071600010 - The dataset includes 2 images of [George Tenet](http://vis-www.cs.umass.edu/lfw/person/George_Tenet.html), the former Director of Central Intelligence (DCI) for the Central Intelligence Agency whose facial biometrics were eventually used to help train facial recognition software in China and Russia -======= -- In 2014, 2/4 of the original authors of the LFW dataset received funding from IARPA and ODNI for their follow up paper "Labeled Faces in the Wild: Updates and New Reporting Procedures" via IARPA contract number 2014-14071600010 -- The LFW dataset was used Center for Intelligent Information Retrieval, the Central Intelligence Agency, the National Security Agency and National - -TODO (need citations for the following) - -- SenseTime, who has relied on LFW for benchmarking their 
facial recognition performance, is one the leading provider of surveillance to the Chinese Government [need citation for this fact. is it the most? or is that Tencent?] -- Two out of 4 of the original authors received funding from the Office of Director of National Intelligence and IARPA for their 2016 LFW survey follow up report - ->>>>>>> 13d7a450affe8ea4f368a97ea2014faa17702a4c    - - ## Code The LFW dataset is so widely used that a popular code library called Sci-Kit Learn includes a function called `fetch_lfw_people` to download the faces in the LFW dataset. @@ -131,7 +122,6 @@ imageio.imwrite('lfw_montage_960.jpg', montage) ### Supplementary Material - ``` load_file assets/lfw_commercial_use.csv name_display, company_url, example_url, country, description @@ -139,14 +129,14 @@ name_display, company_url, example_url, country, description Text and graphics ©Adam Harvey / megapixels.cc - ------- Ignore text below these lines ------- -Research + +### Research - "In our experiments, we used 10000 images and associated captions from the Faces in the wilddata set [3]." - "This work was supported in part by the Center for Intelligent Information Retrieval, the Central Intelligence Agency, the National Security Agency and National Science Foundation under CAREER award IIS-0546666 and grant IIS-0326249." @@ -156,7 +146,11 @@ Research - This research is based upon work supported in part by the Office of the Director of National Intelligence (ODNI), Intelligence Advanced Research Projects Activity (IARPA), via contract number 2014-14071600010. - From "Labeled Faces in the Wild: Updates and New Reporting Procedures" +- 70% of people in the dataset have only 1 image and 29% have 2 or more images + +### Footnotes [^lfw_www]: <http://vis-www.cs.umass.edu/lfw/results.html> [^lfw_baidu]: Jingtuo Liu, Yafeng Deng, Tao Bai, Zhengping Wei, Chang Huang. Targeting Ultimate Accuracy: Face Recognition via Deep Embedding. <https://arxiv.org/abs/1506.07310> [^lfw_pingan]: Lee, Justin. 
"PING AN Tech facial recognition receives high score in latest LFW test results". BiometricUpdate.com. Feb 13, 2017. <https://www.biometricupdate.com/201702/ping-an-tech-facial-recognition-receives-high-score-in-latest-lfw-test-results> + diff --git a/site/content/pages/datasets/mars/assets/background.jpg b/site/content/pages/datasets/mars/assets/background.jpg Binary files differnew file mode 100644 index 00000000..f3440590 --- /dev/null +++ b/site/content/pages/datasets/mars/assets/background.jpg diff --git a/site/content/pages/datasets/mars/assets/index.jpg b/site/content/pages/datasets/mars/assets/index.jpg Binary files differnew file mode 100644 index 00000000..e866defd --- /dev/null +++ b/site/content/pages/datasets/mars/assets/index.jpg diff --git a/site/content/pages/datasets/pubfig/assets/background.jpg b/site/content/pages/datasets/pubfig/assets/background.jpg Binary files differnew file mode 100644 index 00000000..db748a8f --- /dev/null +++ b/site/content/pages/datasets/pubfig/assets/background.jpg diff --git a/site/content/pages/datasets/pubfig/assets/index.jpg b/site/content/pages/datasets/pubfig/assets/index.jpg Binary files differnew file mode 100644 index 00000000..2470b35c --- /dev/null +++ b/site/content/pages/datasets/pubfig/assets/index.jpg diff --git a/site/content/pages/datasets/uccs/assets/background.jpg b/site/content/pages/datasets/uccs/assets/background.jpg Binary files differnew file mode 100644 index 00000000..db6b0180 --- /dev/null +++ b/site/content/pages/datasets/uccs/assets/background.jpg diff --git a/site/content/pages/datasets/uccs/assets/index.jpg b/site/content/pages/datasets/uccs/assets/index.jpg Binary files differnew file mode 100644 index 00000000..9809e564 --- /dev/null +++ b/site/content/pages/datasets/uccs/assets/index.jpg diff --git a/site/content/pages/datasets/uccs/index.md b/site/content/pages/datasets/uccs/index.md index d40dce22..be1d2474 100644 --- a/site/content/pages/datasets/uccs/index.md +++ 
b/site/content/pages/datasets/uccs/index.md @@ -68,7 +68,7 @@ The more recent UCCS version of the dataset received funding from [^funding_uccs - You are welcome to use these images for academic and journalistic use, including research papers, news stories, and presentations. - Please use the following citation: -```MegaPixels.cc Adam Harvey 2013-2109.``` +```MegaPixels.cc Adam Harvey 2013-2019.``` [^funding_sb]: Sapkota, Archana and Boult, Terrance. "Large Scale Unconstrained Open Set Face Database." 2013. [^funding_uccs]: Günther, M. et al. "Unconstrained Face Detection and Open-Set Face Recognition Challenge," 2018. arXiv 1708.02337v3.
\ No newline at end of file diff --git a/site/content/pages/datasets/ucf_selfie/assets/background.jpg b/site/content/pages/datasets/ucf_selfie/assets/background.jpg Binary files differnew file mode 100644 index 00000000..877133e5 --- /dev/null +++ b/site/content/pages/datasets/ucf_selfie/assets/background.jpg diff --git a/site/content/pages/datasets/ucf_selfie/assets/background_02.jpg b/site/content/pages/datasets/ucf_selfie/assets/background_02.jpg Binary files differnew file mode 100644 index 00000000..1e092f61 --- /dev/null +++ b/site/content/pages/datasets/ucf_selfie/assets/background_02.jpg diff --git a/site/content/pages/datasets/ucf_selfie/assets/index.jpg b/site/content/pages/datasets/ucf_selfie/assets/index.jpg Binary files differnew file mode 100644 index 00000000..4837f6e3 --- /dev/null +++ b/site/content/pages/datasets/ucf_selfie/assets/index.jpg diff --git a/site/content/pages/datasets/ucf_selfie/assets/index_02.jpg b/site/content/pages/datasets/ucf_selfie/assets/index_02.jpg Binary files differnew file mode 100644 index 00000000..524340d7 --- /dev/null +++ b/site/content/pages/datasets/ucf_selfie/assets/index_02.jpg diff --git a/site/content/pages/datasets/viper/assets/background.jpg b/site/content/pages/datasets/viper/assets/background.jpg Binary files differnew file mode 100644 index 00000000..db0b2857 --- /dev/null +++ b/site/content/pages/datasets/viper/assets/background.jpg diff --git a/site/content/pages/datasets/ytmu/assets/index.jpg b/site/content/pages/datasets/ytmu/assets/index.jpg Binary files differnew file mode 100644 index 00000000..76716847 --- /dev/null +++ b/site/content/pages/datasets/ytmu/assets/index.jpg diff --git a/site/content/pages/datasets/ytmu/assets/index_02.jpg b/site/content/pages/datasets/ytmu/assets/index_02.jpg Binary files differnew file mode 100644 index 00000000..30c863f6 --- /dev/null +++ b/site/content/pages/datasets/ytmu/assets/index_02.jpg diff --git a/site/content/pages/datasets/ytmu/assets/index_03.jpg 
b/site/content/pages/datasets/ytmu/assets/index_03.jpg Binary files differnew file mode 100644 index 00000000..20ccae90 --- /dev/null +++ b/site/content/pages/datasets/ytmu/assets/index_03.jpg diff --git a/site/content/pages/datasets/ytmu/assets/index_04.jpg b/site/content/pages/datasets/ytmu/assets/index_04.jpg Binary files differnew file mode 100644 index 00000000..3d67baac --- /dev/null +++ b/site/content/pages/datasets/ytmu/assets/index_04.jpg |
