-- Query used in the RJMetrics benchmark report "The State of Data Science" to identify data scientist profiles.
/*
Look for Data Scientists in the following 9 languages:
-- English
-- Spanish
-- French
-- German
-- Dutch
-- Swedish
-- Italian
-- Portuguese
-- Turkish
*/
/*
Rebuilds linkedin_people.data_scientists_pid from linkedin_people.all_employees_pid.

A profile is kept when its headline or title
    -- names an academic role together with the data science field, or
    -- names an executive or senior role together with the data science field, or
    -- carries an explicit Chief Data Scientist / Chief Data Officer title, or
    -- carries a plain Data Scientist title,
and none of the exclusion patterns at the bottom of the query match.

Each kept profile gets a level (first matching rule wins):
    -- executive
        Chief DS, Chief Data Officer (not Digital Officer), CMO, COO,
        CEO, CTO, founder, co-founder, owner, SVP, VP, president
    -- senior
        director, manager, lead, head, senior data scientist, principal
        (unless the headline or title contains "academic")
    -- academic
        professor, lecturer
    -- questionable
        have words "hiring", "looking" in the headline or title
    -- junior
        everybody else

Every keyword family is evaluated once in the keyword_flags CTE as a 0/1 flag and then
reused by both the row filter and the level CASE, so the two can no longer drift apart.
A family whose LIKE chain evaluates to NULL (e.g. NULL headline and title) becomes 0;
the flags are only combined with AND/OR, so this does not change which rows qualify.

NOTE(review): all patterns are lowercase and only company_name is passed through lower();
    presumably headline and title are already lowercased upstream -- confirm.
NOTE(review): the % wildcards inside words (e.g. 'donn%es', 'gr%nder') presumably stand in
    for accented characters -- confirm.
*/
drop table if exists linkedin_people.data_scientists_pid;
create table linkedin_people.data_scientists_pid distkey(li_person_id) as
with keyword_flags as
(
    select
        li_person_id, li_company_id, company_name, first_name, last_name, title, headline,
        location, country_code, raw_date_started, month_started, year_started, date_started,
        position_duration, person_industry, num_connections, date_last_visited, date_updated,
        /*
        Executive keywords (C-level, president, founder, owner, VP)
        NOTE(review): the title check for '%vp%' has no '%mvp%' guard, unlike the headline check -- confirm intent.
        */
        case when
        (
            headline like '%chief%' or
            headline like '%president%' or
            headline like '%ceo%' or
            (headline like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
            (headline like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
            headline like '%director ejecutivo%' /* Spanish */ or
            headline like '%cmo%' or
            headline like 'coo %' or
            headline like '% coo' or
            headline like '% coo %' or
            headline like '%/coo' or
            (headline like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
            (headline like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
            (headline like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
            (headline like '%diretor de opera%es%' and (country_code = 'BR' or country_code = 'PT')) /* Portuguese */ or
            headline like '%director de operaciones%' /* Spanish */ or
            headline like 'cto %' /* English, German, Italian, Swedish */ or
            headline like '% cto' or
            headline like '% cto %' or
            headline like '%/cto' or
            (headline like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
            (headline like '%diretor de tecnologia%' and (country_code = 'BR' or country_code = 'PT')) /* Portuguese */ or
            (headline like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
            (headline like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
            headline like '%director tecnol%gico%' /* Spanish */ or
            (headline like '%founder%' and headline not like '%group%') /* English */ or
            (headline like '%fondateur%' and country_code = 'FR') /* French */ or
            (headline like '%gr%nder%' and country_code = 'DE') /* German */ or
            (headline like '%oprichter%' and country_code = 'NL') /* Dutch */ or
            (headline like '%fondatore%' and country_code = 'IT') /* Italian */ or
            (headline like '%grundare%' and country_code = 'SE') /* Swedish */ or
            (headline like '%kurucu%' and country_code = 'TR') /* Turkish */ or
            headline like '%fundador%' /* Portuguese, Spanish */ or
            headline like '%owner %' or
            headline like '% owner%' or
            headline like '%propri%ta%r%' /* French, Italian, Portuguese */ or
            (headline like '%inhaber%' and country_code = 'DE') /* German */ or
            (headline like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
            (headline like '%sahip%' and country_code = 'TR') /* Turkish */ or
            headline like '%propietario%' /* Spanish */ or
            (headline like '%vp%' and headline not like '%mvp%') or
            headline like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            (headline like '%vizepr%sident%' and country_code = 'DE') /* German */ or
            (headline like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */ or
            title like '%chief%' or
            title like '%vp%' or
            title like '%president%' or
            title like '%ceo%' or
            (title like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
            (title like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
            title like '%director ejecutivo%' /* Spanish */ or
            title like '%cmo%' or
            title like 'coo %' or
            title like '% coo' or
            title like '% coo %' or
            title like '%/coo' or
            (title like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
            (title like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
            (title like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
            (title like '%diretor de opera%es%' and (country_code = 'BR' or country_code = 'PT')) /* Portuguese */ or
            title like '%director de operaciones%' /* Spanish */ or
            title like 'cto %' /* English, German, Italian, Swedish */ or
            title like '% cto' or
            title like '% cto %' or
            title like '%/cto' or
            (title like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
            (title like '%diretor de tecnologia%' and (country_code = 'BR' or country_code = 'PT')) /* Portuguese */ or
            (title like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
            (title like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
            title like '%director tecnol%gico%' /* Spanish */ or
            (title like '%founder%' and title not like '%group%') /* English */ or
            (title like '%fondateur%' and country_code = 'FR') /* French */ or
            (title like '%gr%nder%' and country_code = 'DE') /* German */ or
            (title like '%oprichter%' and country_code = 'NL') /* Dutch */ or
            (title like '%fondatore%' and country_code = 'IT') /* Italian */ or
            (title like '%grundare%' and country_code = 'SE') /* Swedish */ or
            (title like '%kurucu%' and country_code = 'TR') /* Turkish */ or
            title like '%fundador%' /* Portuguese, Spanish */ or
            title like '%owner %' or
            title like '% owner%' or
            title like '%propri%ta%r%' /* French, Italian, Portuguese */ or
            (title like '%inhaber%' and country_code = 'DE') /* German */ or
            (title like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
            (title like '%sahip%' and country_code = 'TR') /* Turkish */ or
            title like '%propietario%' /* Spanish */ or
            title like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            (title like '%vizepr%sident%' and country_code = 'DE') /* German */ or
            (title like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */
        ) then 1 else 0 end as has_executive_keyword,
        /*
        Explicit Chief Data Scientist / Chief Data Officer titles
        (qualify a profile on their own and always map to the executive level)
        */
        case when
        (
            /* Chief Data Scientist */
            headline like '%chief data%scientist%' /* English, Dutch */ or
            headline like '%jefe cient%fico de datos%' /* Spanish */ or
            headline like '%scientifique%chef de donn%es%' /* French */ or
            headline like '%chef%daten%wissenschaftler%' /* German */ or
            headline like '%cientista%chefe dados%' /* Portuguese */ or
            headline like '%scienziato%dati capo%' /* Italian */ or
            headline like '%ba%veri bilimci%' /* Turkish */ or
            title like '%chief data%scientist%' /* English, Dutch */ or
            title like '%jefe cient%fico de datos%' /* Spanish */ or
            title like '%scientifique%chef de donn%es%' /* French */ or
            title like '%chef%daten%wissenschaftler%' /* German */ or
            title like '%cientista%chefe dados%' /* Portuguese */ or
            title like '%scienziato%dati capo%' /* Italian */ or
            title like '%ba%veri bilimci%' /* Turkish */ or
            /* Chief Data Officer */
            headline like '%chief data%officer%' /* English, Dutch, German, French */ or
            headline like '%director de los datos%' /* Spanish */ or
            headline like '%directeur des donn%es%' /* French */ or
            (headline like '%direttore dati%' and headline not like '%foundation%') /* Italian */ or
            headline like '%de dados principal%' /* Portuguese */ or
            title like '%chief data%officer%' /* English, Dutch, German, French */ or
            title like '%director de los datos%' /* Spanish */ or
            title like '%directeur des donn%es%' /* French */ or
            (title like '%direttore dati%' and title not like '%foundation%') /* Italian */ or
            title like '%de dados principal%' /* Portuguese */
        ) then 1 else 0 end as has_chief_data_title,
        /*
        Senior keywords (director, manager, principal, senior, lead, head)
        NOTE(review): '%direkt%r%' is labelled German, Swedish but is gated on NL/SE, not DE -- confirm intent.
        */
        case when
        (
            headline like '%director%' /* English, Spanish */ or
            (headline like '%directeur%' and (country_code = 'FR' or country_code = 'NL')) /* French, Dutch */ or
            (headline like '%direttore%' and country_code = 'IT') /* Italian */ or
            (headline like '%direkt%r%' and (country_code = 'NL' or country_code = 'SE')) /* German, Swedish */ or
            (headline like '%diretor%' and (country_code = 'BR' or country_code = 'PT')) /* Portuguese */ or
            headline like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            headline like '%manager%' /* English, French, German, Italian, Dutch */ or
            (headline like '%responsabile%' and country_code = 'IT') /* Italian */ or
            (headline like '%ledare%' and country_code = 'SE') /* Swedish */ or
            (headline like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
            headline like '%gerente%' /* Portuguese, Spanish */ or
            headline like '%principal%' or
            headline like '%senior%' or
            (headline like '%sr %' and headline not like '%sr base%' and headline not like '%sr. base%') or
            (headline like '%sr. %' and headline not like '%sr. base%') or
            headline like '%lead %' or
            headline like '%lead,%' or
            headline like '%head %' or
            headline like '%head,%' or
            (headline like '%hoofd%' and country_code = 'NL') /* Dutch */ or
            (headline like '%ba%kan%' and country_code = 'TR') /* Turkish */ or
            title like '%director%' /* English, Spanish */ or
            (title like '%directeur%' and (country_code = 'FR' or country_code = 'NL')) /* French, Dutch */ or
            (title like '%direttore%' and country_code = 'IT') /* Italian */ or
            (title like '%direkt%r%' and (country_code = 'NL' or country_code = 'SE')) /* German, Swedish */ or
            (title like '%diretor%' and (country_code = 'BR' or country_code = 'PT')) /* Portuguese */ or
            title like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            title like '%manager%' /* English, French, German, Italian, Dutch */ or
            (title like '%responsabile%' and country_code = 'IT') /* Italian */ or
            (title like '%ledare%' and country_code = 'SE') /* Swedish */ or
            (title like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
            title like '%gerente%' /* Portuguese, Spanish */ or
            title like '%principal%' or
            title like '%senior%' or
            (title like '%sr %' and title not like '%sr base%' and title not like '%sr. base%') or
            (title like '%sr. %' and title not like '%sr. base%') or
            title like '%lead %' or
            title like '%lead,%' or
            title like '%head %' or
            title like '%head,%' or
            (title like '%hoofd%' and country_code = 'NL') /* Dutch */ or
            (title like '%ba%kan%' and country_code = 'TR') /* Turkish */
        ) then 1 else 0 end as has_senior_keyword,
        /*
        Academic keywords (professor, lecturer)
        */
        case when
        (
            headline like '%professor%' /* English, Dutch, German, Portuguese, Italian */ or
            headline like '%profesor%' /* Spanish */ or
            headline like '%professeur%' /* French */ or
            headline similar to '%profes_r%' /* Turkish */ or
            title like '%professor%' /* English, Dutch, German, Portuguese, Italian */ or
            title like '%profesor%' /* Spanish */ or
            title like '%professeur%' /* French */ or
            title similar to '%profes_r%' /* Turkish */ or
            headline like '%lecturer%' /* English */ or
            headline like '%lector%' /* Dutch */ or
            headline like '%charg%de cours%' /* French */ or
            headline like '%dozent%' /* German */ or
            headline like '%docente%' /* Italian */ or
            headline like '%okutman%' /* Turkish */ or
            title like '%lecturer%' /* English */ or
            title like '%lector%' /* Dutch */ or
            title like '%charg%de cours%' /* French */ or
            title like '%dozent%' /* German */ or
            title like '%docente%' /* Italian */ or
            title like '%okutman%' /* Turkish */
        ) then 1 else 0 end as has_academic_keyword,
        /*
        Data science named as a field anywhere except the English/Dutch headline form.
        headline like '%data science%' is checked in the final filter instead, because
        for executive/senior profiles it needs an extra employer-name guard.
        */
        case when
        (
            headline like '%ciencia de datos%' /* Spanish */ or
            headline like '%science des donn%es%' /* French */ or
            headline like '%daten%wissenschaft%' /* German */ or
            headline like '%ci%ncia dados%' /* Portuguese */ or
            headline like '%scienza dati%' /* Italian */ or
            headline like '%veri bilimi%' /* Turkish */ or
            title like '%data science%' /* English, Dutch */ or
            title like '%ciencia de datos%' /* Spanish */ or
            title like '%science des donn%es%' /* French */ or
            title like '%daten%wissenschaft%' /* German */ or
            title like '%ci%ncia dados%' /* Portuguese */ or
            title like '%scienza dati%' /* Italian */ or
            title like '%veri bilimi%' /* Turkish */
        ) then 1 else 0 end as mentions_data_science_elsewhere,
        /*
        Plain Data Scientists
        */
        case when
        (
            headline like '%data scientist%' /* English, Dutch */ or
            headline like '%cient%fico de datos%' /* Spanish */ or
            headline like '%scientifique de donn%es%' /* French */ or
            headline like '%daten%wis%enschaftler%' /* German */ or
            headline like '%cientista de dados%' /* Portuguese */ or
            headline like '%scienziato dati%' /* Italian */ or
            headline like '%veri bilimci%' /* Turkish */ or
            title like '%data scientist%' /* English, Dutch */ or
            title like '%cient%fico de datos%' /* Spanish */ or
            title like '%scientifique de donn%es%' /* French */ or
            title like '%daten%wis%enschaftler%' /* German */ or
            title like '%cientista de dados%' /* Portuguese */ or
            title like '%scienziato dati%' /* Italian */ or
            title like '%veri bilimci%' /* Turkish */
        ) then 1 else 0 end as has_data_scientist_title
    from linkedin_people.all_employees_pid
)
select
    li_person_id, li_company_id, company_name, first_name, last_name, title, headline,
    case
        when has_executive_keyword = 1 or has_chief_data_title = 1 then 'executive'
        when
            has_senior_keyword = 1 and
            (headline not like '%academic%' or headline is null) and
            (title not like '%academic%' or title is null)
        then 'senior'
        when has_academic_keyword = 1 then 'academic'
        when
        (
            headline like '%hiring%' or
            headline like '%looking%' or
            title like '%hiring%' or
            title like '%looking%'
        ) then 'questionable'
        else 'junior'
    end as level,
    location, country_code, raw_date_started, month_started, year_started, date_started,
    position_duration, person_industry, num_connections, date_last_visited, date_updated
from keyword_flags
where
(
    /*
    Lecturers and Professors of Data Science
    */
    (
        has_academic_keyword = 1 and
        (headline like '%data science%' /* English, Dutch */ or mentions_data_science_elsewhere = 1)
    )
    or
    /*
    Executive and Senior Level in Data Science.
    An English/Dutch headline mention only counts when "data science" does not
    appear in the company name or after " at " in the headline.
    */
    (
        (has_executive_keyword = 1 or has_senior_keyword = 1) and
        (
            (
                headline like '%data science%' and
                lower(company_name) not like '%data science%' and
                headline not like '% at %data%science%'
            ) /* English, Dutch */
            or mentions_data_science_elsewhere = 1
        )
    )
    or
    /*
    Explicit Chief Data Scientist / Chief Data Officer titles
    */
    has_chief_data_title = 1
    or
    /*
    Plain Data Scientists
    */
    has_data_scientist_title = 1
)
and
(
    /*
    Chief DS and CDO exceptions
    NOTE(review): the title pattern '%office%of%' is broader than the headline
    pattern '%office%of%chief%data%' -- confirm intent.
    */
    (headline not like '%office%of%chief%data%' or headline is null) and
    (headline not like '%coordonnat%' or headline is null) and
    (headline not like '%bases de donn%' or headline is null) and
    (headline not like '%scientifiques et donn%es%' or headline is null) and
    (headline not like '%scientifique sp%cialis%' or headline is null) and
    (headline not like '%r%dactrice scientifique%' or headline is null) and
    (headline not like '%qualit% des donn%es%' or headline is null) and
    (title not like '%office%of%' or title is null) and
    (title not like '%coordonnat%' or title is null) and
    (title not like '%bases de donn%' or title is null) and
    (title not like '%scientifiques et donn%es%' or title is null) and
    (title not like '%scientifique sp%cialis%' or title is null) and
    (title not like '%r%dactrice scientifique%' or title is null) and
    (title not like '%qualit% des donn%es%' or title is null) and
    /*
    Exclude analysts listing data scientist titles
    */
    (headline not like '%analyst%' or headline is null) /* English, Dutch, German, French */ and
    (headline not like '%analist%' or headline is null) /* Spanish, Portuguese, Italian, Turkish */ and
    (title not like '%analyst%' or title is null) /* English, Dutch, German, French */ and
    (title not like '%analist%' or title is null) /* Spanish, Portuguese, Italian, Turkish */ and
    /*
    Exclude people listing DS incubators in their headline
    */
    (headline not like '%insight data science%' or headline is null) and
    (headline not like '%data incubator%' or headline is null) and
    (headline not like '%metis%' or headline is null) and
    (headline not like '%general assemb%' or headline is null) and
    /*
    Other exceptions
    NOTE(review): '%hr%' matches any text containing the letters "hr", not just the word HR -- confirm intent.
    */
    (headline not like '%hr%' or headline is null) and
    (headline not like '%recruiter%' or headline is null) and
    (headline not like '%exec search%' or headline is null) and
    (headline not like '%buyer%' or headline is null) and
    (headline not like '%seller%' or headline is null) and
    (headline not like '%account dev%' or headline is null) and
    (headline not like '%student%' or headline is null) and
    (headline not like '%leading%' or headline is null) and
    (headline not like '%heading%' or headline is null) and
    (headline not like '%data science major%' or headline is null) and
    (title not like '%hr%' or title is null) and
    (title not like '%recruiter%' or title is null) and
    (title not like '%exec search%' or title is null) and
    (title not like '%buyer%' or title is null) and
    (title not like '%seller%' or title is null) and
    (title not like '%account dev%' or title is null) and
    (title not like '%student%' or title is null) and
    (title not like '%leading%' or title is null) and
    (title not like '%heading%' or title is null) and
    (title not like '%data science major%' or title is null)
);
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment