Skip to content

Instantly share code, notes, and snippets.

@jthandy
Created October 7, 2015 15:56
Show Gist options
  • Save jthandy/43fa2ac56bd7ffc181f1 to your computer and use it in GitHub Desktop.
Save jthandy/43fa2ac56bd7ffc181f1 to your computer and use it in GitHub Desktop.
The query we used in the RJMetrics benchmark report "The State of Data Science" to identify data scientist profiles.
/*
Look for Data Scientists in the following 9 languages:
-- English
-- Spanish
-- French
-- German
-- Dutch
-- Swedish
-- Italian
-- Portuguese
-- Turkish
*/
/*
Rebuild the result table from scratch on every run: drop any previous copy,
then recreate it from the query that follows, distributed on li_person_id.
*/
drop table if exists linkedin_people.data_scientists_pid;
create table linkedin_people.data_scientists_pid distkey(li_person_id) as
(
/*
Add levels:
-- executive
Chief DS, Chief Data Officer (not Digital Officer), CMO, COO,
CEO, CTO, founder, co-founder, owner, SVP, VP, president
-- senior
director, manager, lead, head, senior data scientist, principal
-- junior
everybody else, but not in academia
-- academic
professor, lecturer
-- questionable
have words "hiring", "looking for" in the headline
*/
select li_person_id, li_company_id, company_name, first_name, last_name, title, headline,
case
/*
'executive' branch of the level classifier.
Matches C-level / president / VP / founder / owner wording in the headline or
the title (English plus localized equivalents), or an explicit Chief Data
Scientist / Chief Data Officer title.
Localized terms are gated on country_code where the author chose to do so.
Short acronyms (coo, cto) are matched only as whole words: start, end,
space-delimited, or after a slash.
*/
when
(
    /* ---- headline: C-level, president ---- */
    headline like '%chief%' or
    headline like '%president%' or
    headline like '%ceo%' or
    (headline like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
    (headline like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
    headline like '%director ejecutivo%' /* Spanish */ or
    headline like '%cmo%' or
    headline like 'coo %' or
    headline like '% coo' or
    headline like '% coo %' or
    headline like '%/coo' or
    (headline like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
    (headline like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
    (headline like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
    (headline like '%diretor de opera%es%' and country_code in ('BR', 'PT')) /* Portuguese */ or
    headline like '%director de operaciones%' /* Spanish */ or
    headline like 'cto %' /* English, German, Italian, Swedish */ or
    headline like '% cto' or
    headline like '% cto %' or
    headline like '%/cto' or
    (headline like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
    (headline like '%diretor de tecnologia%' and country_code in ('BR', 'PT')) /* Portuguese */ or
    (headline like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
    (headline like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
    headline like '%director tecnol%gico%' /* Spanish */ or
    /* ---- headline: founder ---- */
    (headline like '%founder%' and headline not like '%group%') /* English */ or
    (headline like '%fondateur%' and country_code = 'FR') /* French */ or
    (headline like '%gr%nder%' and country_code = 'DE') /* German */ or
    (headline like '%oprichter%' and country_code = 'NL') /* Dutch */ or
    (headline like '%fondatore%' and country_code = 'IT') /* Italian */ or
    (headline like '%grundare%' and country_code = 'SE') /* Swedish */ or
    (headline like '%kurucu%' and country_code = 'TR') /* Turkish */ or
    headline like '%fundador%' /* Portuguese, Spanish */ or
    /* ---- headline: owner ---- */
    headline like '%owner %' or
    headline like '% owner%' or
    headline like '%propri%ta%r%' /* French, Italian, Portuguese */ or
    (headline like '%inhaber%' and country_code = 'DE') /* German */ or
    (headline like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
    (headline like '%sahip%' and country_code = 'TR') /* Turkish */ or
    headline like '%propietario%' /* Spanish */ or
    /* ---- headline: vice president ("mvp" is not a VP) ---- */
    (headline like '%vp%' and headline not like '%mvp%') or
    headline like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
    (headline like '%vizepr%sident%' and country_code = 'DE') /* German */ or
    (headline like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */ or
    /* ---- title: C-level, president ---- */
    title like '%chief%' or
    title like '%president%' or
    title like '%ceo%' or
    (title like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
    (title like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
    title like '%director ejecutivo%' /* Spanish */ or
    title like '%cmo%' or
    title like 'coo %' or
    title like '% coo' or
    title like '% coo %' or
    title like '%/coo' or
    (title like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
    (title like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
    (title like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
    (title like '%diretor de opera%es%' and country_code in ('BR', 'PT')) /* Portuguese */ or
    title like '%director de operaciones%' /* Spanish */ or
    title like 'cto %' /* English, German, Italian, Swedish */ or
    title like '% cto' or
    title like '% cto %' or
    title like '%/cto' or
    (title like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
    (title like '%diretor de tecnologia%' and country_code in ('BR', 'PT')) /* Portuguese */ or
    (title like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
    (title like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
    title like '%director tecnol%gico%' /* Spanish */ or
    /* ---- title: founder ---- */
    (title like '%founder%' and title not like '%group%') /* English */ or
    (title like '%fondateur%' and country_code = 'FR') /* French */ or
    (title like '%gr%nder%' and country_code = 'DE') /* German */ or
    (title like '%oprichter%' and country_code = 'NL') /* Dutch */ or
    (title like '%fondatore%' and country_code = 'IT') /* Italian */ or
    (title like '%grundare%' and country_code = 'SE') /* Swedish */ or
    (title like '%kurucu%' and country_code = 'TR') /* Turkish */ or
    title like '%fundador%' /* Portuguese, Spanish */ or
    /* ---- title: owner ---- */
    title like '%owner %' or
    title like '% owner%' or
    title like '%propri%ta%r%' /* French, Italian, Portuguese */ or
    (title like '%inhaber%' and country_code = 'DE') /* German */ or
    (title like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
    (title like '%sahip%' and country_code = 'TR') /* Turkish */ or
    title like '%propietario%' /* Spanish */ or
    /* ---- title: vice president; same "mvp" guard as the headline test ---- */
    (title like '%vp%' and title not like '%mvp%') or
    title like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
    (title like '%vizepr%sident%' and country_code = 'DE') /* German */ or
    (title like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */ or
    /*
    Explicit Chief Data Scientist titles
    */
    headline like '%chief data%scientist%' /* English, Dutch */ or
    headline like '%jefe cient%fico de datos%' /* Spanish */ or
    headline like '%scientifique%chef de donn%es%' /* French */ or
    headline like '%chef%daten%wissenschaftler%' /* German */ or
    headline like '%cientista%chefe dados%' /* Portuguese */ or
    headline like '%scienziato%dati capo%' /* Italian */ or
    headline like '%ba%veri bilimci%' /* Turkish */ or
    title like '%chief data%scientist%' /* English, Dutch */ or
    title like '%jefe cient%fico de datos%' /* Spanish */ or
    title like '%scientifique%chef de donn%es%' /* French */ or
    title like '%chef%daten%wissenschaftler%' /* German */ or
    title like '%cientista%chefe dados%' /* Portuguese */ or
    title like '%scienziato%dati capo%' /* Italian */ or
    title like '%ba%veri bilimci%' /* Turkish */ or
    /*
    Explicit Chief Data Officer titles
    */
    headline like '%chief data%officer%' /* English, Dutch, German, French */ or
    headline like '%director de los datos%' /* Spanish */ or
    headline like '%directeur des donn%es%' /* French */ or
    (headline like '%direttore dati%' and headline not like '%foundation%') /* Italian */ or
    headline like '%de dados principal%' /* Portuguese */ or
    title like '%chief data%officer%' /* English, Dutch, German, French */ or
    title like '%director de los datos%' /* Spanish */ or
    title like '%directeur des donn%es%' /* French */ or
    (title like '%direttore dati%' and title not like '%foundation%') /* Italian */ or
    title like '%de dados principal%' /* Portuguese */
) then 'executive'
/*
'senior' branch of the level classifier.
Matches director / manager / principal / senior / lead / head wording in the
headline or the title, unless either field mentions "academic".
Only reached when the 'executive' branch above did not match.
*/
when
(
    /* ---- headline ---- */
    headline like '%director%' /* English, Spanish */ or
    (headline like '%directeur%' and country_code in ('FR', 'NL')) /* French, Dutch */ or
    (headline like '%direttore%' and country_code = 'IT') /* Italian */ or
    /* 'DE' added: the term is documented as German/Swedish but was gated on NL/SE only */
    (headline like '%direkt%r%' and country_code in ('DE', 'NL', 'SE')) /* German, Swedish */ or
    (headline like '%diretor%' and country_code in ('BR', 'PT')) /* Portuguese */ or
    headline like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
    headline like '%manager%' /* English, French, German, Italian, Dutch */ or
    (headline like '%responsabile%' and country_code = 'IT') /* Italian */ or
    (headline like '%ledare%' and country_code = 'SE') /* Swedish */ or
    (headline like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
    headline like '%gerente%' /* Portuguese, Spanish */ or
    headline like '%principal%' or
    headline like '%senior%' or
    (headline like '%sr %' and headline not like '%sr base%' and headline not like '%sr. base%') or
    (headline like '%sr. %' and headline not like '%sr. base%') or
    /* trailing space/comma keeps "leading" and "heading" from matching */
    headline like '%lead %' or
    headline like '%lead,%' or
    headline like '%head %' or
    headline like '%head,%' or
    (headline like '%hoofd%' and country_code = 'NL') /* Dutch */ or
    (headline like '%ba%kan%' and country_code = 'TR') /* Turkish */ or
    /* ---- title ---- */
    title like '%director%' /* English, Spanish */ or
    (title like '%directeur%' and country_code in ('FR', 'NL')) /* French, Dutch */ or
    (title like '%direttore%' and country_code = 'IT') /* Italian */ or
    (title like '%direkt%r%' and country_code in ('DE', 'NL', 'SE')) /* German, Swedish */ or
    (title like '%diretor%' and country_code in ('BR', 'PT')) /* Portuguese */ or
    title like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
    title like '%manager%' /* English, French, German, Italian, Dutch */ or
    (title like '%responsabile%' and country_code = 'IT') /* Italian */ or
    (title like '%ledare%' and country_code = 'SE') /* Swedish */ or
    (title like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
    title like '%gerente%' /* Portuguese, Spanish */ or
    title like '%principal%' or
    title like '%senior%' or
    (title like '%sr %' and title not like '%sr base%' and title not like '%sr. base%') or
    (title like '%sr. %' and title not like '%sr. base%') or
    title like '%lead %' or
    title like '%lead,%' or
    title like '%head %' or
    title like '%head,%' or
    (title like '%hoofd%' and country_code = 'NL') /* Dutch */ or
    (title like '%ba%kan%' and country_code = 'TR') /* Turkish */
)
and
(
    /* a NULL field cannot mention "academic", so it passes this guard */
    (headline not like '%academic%' or headline is null) and
    (title not like '%academic%' or title is null)
) then 'senior'
/*
Remaining branches of the level classifier, evaluated in order:
  'academic'     - professor / lecturer wording in headline or title
  'questionable' - "hiring" / "looking" wording in headline or title
  'junior'       - everything that matched no earlier branch
*/
when
(
    /* professor */
    headline like '%professor%' or title like '%professor%' /* English, Dutch, German, Portuguese, Italian */ or
    headline like '%profesor%' or title like '%profesor%' /* Spanish */ or
    headline like '%professeur%' or title like '%professeur%' /* French */ or
    headline similar to '%profes_r%' or title similar to '%profes_r%' /* Turkish */ or
    /* lecturer */
    headline like '%lecturer%' or title like '%lecturer%' /* English */ or
    headline like '%lector%' or title like '%lector%' /* Dutch */ or
    headline like '%charg%de cours%' or title like '%charg%de cours%' /* French */ or
    headline like '%dozent%' or title like '%dozent%' /* German */ or
    headline like '%docente%' or title like '%docente%' /* Italian */ or
    headline like '%okutman%' or title like '%okutman%' /* Turkish */
) then 'academic'
when
(
    headline like '%hiring%' or title like '%hiring%' or
    headline like '%looking%' or title like '%looking%'
) then 'questionable'
else 'junior'
end
as level,
location, country_code, raw_date_started, month_started, year_started, date_started,
position_duration, person_industry, num_connections, date_last_visited, date_updated
from
(
/*
Candidate rows: profiles from all_employees_pid that pass the inclusion and
exclusion filters in the where clause below. The column list mirrors what the
outer select needs (the level classifier reads title, headline and country_code).
*/
select li_person_id, li_company_id, company_name, first_name, last_name, title, headline,
location, country_code, raw_date_started, month_started, year_started, date_started,
position_duration, person_industry, num_connections, date_last_visited, date_updated
from linkedin_people.all_employees_pid
where
(
/*
Lecturers and Professors of Data Science:
an academic role word AND a "data science" phrase, each found in either the
headline or the title.
*/
(
    (
        /* role: professor */
        headline like '%professor%' or title like '%professor%' /* English, Dutch, German, Portuguese, Italian */ or
        headline like '%profesor%' or title like '%profesor%' /* Spanish */ or
        headline like '%professeur%' or title like '%professeur%' /* French */ or
        headline similar to '%profes_r%' or title similar to '%profes_r%' /* Turkish */ or
        /* role: lecturer */
        headline like '%lecturer%' or title like '%lecturer%' /* English */ or
        headline like '%lector%' or title like '%lector%' /* Dutch */ or
        headline like '%charg%de cours%' or title like '%charg%de cours%' /* French */ or
        headline like '%dozent%' or title like '%dozent%' /* German */ or
        headline like '%docente%' or title like '%docente%' /* Italian */ or
        headline like '%okutman%' or title like '%okutman%' /* Turkish */
    )
    and
    (
        /* topic: data science */
        headline like '%data science%' or title like '%data science%' /* English, Dutch */ or
        headline like '%ciencia de datos%' or title like '%ciencia de datos%' /* Spanish */ or
        headline like '%science des donn%es%' or title like '%science des donn%es%' /* French */ or
        headline like '%daten%wissenschaft%' or title like '%daten%wissenschaft%' /* German */ or
        headline like '%ci%ncia dados%' or title like '%ci%ncia dados%' /* Portuguese */ or
        headline like '%scienza dati%' or title like '%scienza dati%' /* Italian */ or
        headline like '%veri bilimi%' or title like '%veri bilimi%' /* Turkish */
    )
)
or
/*
Executive Level:
an executive role word (C-level, president, VP, founder, owner) AND a
"data science" phrase, each found in either the headline or the title.
For the English headline phrase, the match is rejected when "data science"
appears to be part of the employer's name rather than the person's role.
*/
(
    (
        /* ---- headline: C-level, president ---- */
        headline like '%chief%' or
        headline like '%president%' or
        headline like '%ceo%' or
        (headline like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
        (headline like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
        headline like '%director ejecutivo%' /* Spanish */ or
        headline like '%cmo%' or
        headline like 'coo %' or
        headline like '% coo' or
        headline like '% coo %' or
        headline like '%/coo' or
        (headline like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
        (headline like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
        (headline like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
        (headline like '%diretor de opera%es%' and country_code in ('BR', 'PT')) /* Portuguese */ or
        headline like '%director de operaciones%' /* Spanish */ or
        headline like 'cto %' /* English, German, Italian, Swedish */ or
        headline like '% cto' or
        headline like '% cto %' or
        headline like '%/cto' or
        (headline like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
        (headline like '%diretor de tecnologia%' and country_code in ('BR', 'PT')) /* Portuguese */ or
        (headline like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
        (headline like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
        headline like '%director tecnol%gico%' /* Spanish */ or
        /* ---- headline: founder ---- */
        (headline like '%founder%' and headline not like '%group%') /* English */ or
        (headline like '%fondateur%' and country_code = 'FR') /* French */ or
        (headline like '%gr%nder%' and country_code = 'DE') /* German */ or
        (headline like '%oprichter%' and country_code = 'NL') /* Dutch */ or
        (headline like '%fondatore%' and country_code = 'IT') /* Italian */ or
        (headline like '%grundare%' and country_code = 'SE') /* Swedish */ or
        (headline like '%kurucu%' and country_code = 'TR') /* Turkish */ or
        headline like '%fundador%' /* Portuguese, Spanish */ or
        /* ---- headline: owner ---- */
        headline like '%owner %' or
        headline like '% owner%' or
        headline like '%propri%ta%r%' /* French, Italian, Portuguese */ or
        (headline like '%inhaber%' and country_code = 'DE') /* German */ or
        (headline like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
        (headline like '%sahip%' and country_code = 'TR') /* Turkish */ or
        headline like '%propietario%' /* Spanish */ or
        /* ---- headline: vice president ("mvp" is not a VP) ---- */
        (headline like '%vp%' and headline not like '%mvp%') or
        headline like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
        (headline like '%vizepr%sident%' and country_code = 'DE') /* German */ or
        (headline like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */ or
        /* ---- title: C-level, president ---- */
        title like '%chief%' or
        title like '%president%' or
        title like '%ceo%' or
        (title like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
        (title like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
        title like '%director ejecutivo%' /* Spanish */ or
        title like '%cmo%' or
        title like 'coo %' or
        title like '% coo' or
        title like '% coo %' or
        title like '%/coo' or
        (title like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
        (title like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
        (title like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
        (title like '%diretor de opera%es%' and country_code in ('BR', 'PT')) /* Portuguese */ or
        title like '%director de operaciones%' /* Spanish */ or
        title like 'cto %' /* English, German, Italian, Swedish */ or
        title like '% cto' or
        title like '% cto %' or
        title like '%/cto' or
        (title like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
        (title like '%diretor de tecnologia%' and country_code in ('BR', 'PT')) /* Portuguese */ or
        (title like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
        (title like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
        title like '%director tecnol%gico%' /* Spanish */ or
        /* ---- title: founder ---- */
        (title like '%founder%' and title not like '%group%') /* English */ or
        (title like '%fondateur%' and country_code = 'FR') /* French */ or
        (title like '%gr%nder%' and country_code = 'DE') /* German */ or
        (title like '%oprichter%' and country_code = 'NL') /* Dutch */ or
        (title like '%fondatore%' and country_code = 'IT') /* Italian */ or
        (title like '%grundare%' and country_code = 'SE') /* Swedish */ or
        (title like '%kurucu%' and country_code = 'TR') /* Turkish */ or
        title like '%fundador%' /* Portuguese, Spanish */ or
        /* ---- title: owner ---- */
        title like '%owner %' or
        title like '% owner%' or
        title like '%propri%ta%r%' /* French, Italian, Portuguese */ or
        (title like '%inhaber%' and country_code = 'DE') /* German */ or
        (title like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
        (title like '%sahip%' and country_code = 'TR') /* Turkish */ or
        title like '%propietario%' /* Spanish */ or
        /* ---- title: vice president; same "mvp" guard as the headline test ---- */
        (title like '%vp%' and title not like '%mvp%') or
        title like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
        (title like '%vizepr%sident%' and country_code = 'DE') /* German */ or
        (title like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */
    )
    and
    (
        (
            headline like '%data science%' and
            /* a NULL company_name must not silently drop the row */
            (company_name is null or lower(company_name) not like '%data science%') and
            headline not like '% at %data%science%'
        ) /* English, Dutch */ or
        headline like '%ciencia de datos%' /* Spanish */ or
        headline like '%science des donn%es%' /* French */ or
        headline like '%daten%wissenschaft%' /* German */ or
        headline like '%ci%ncia dados%' /* Portuguese */ or
        headline like '%scienza dati%' /* Italian */ or
        headline like '%veri bilimi%' /* Turkish */ or
        title like '%data science%' /* English, Dutch */ or
        title like '%ciencia de datos%' /* Spanish */ or
        title like '%science des donn%es%' /* French */ or
        title like '%daten%wissenschaft%' /* German */ or
        title like '%ci%ncia dados%' /* Portuguese */ or
        title like '%scienza dati%' /* Italian */ or
        title like '%veri bilimi%' /* Turkish */
    )
)
or
/*
Senior Level:
a seniority word (director, manager, principal, senior, lead, head) AND a
"data science" phrase, each found in either the headline or the title.
For the English headline phrase, the match is rejected when "data science"
appears to be part of the employer's name rather than the person's role.
*/
(
    (
        /* ---- headline ---- */
        headline like '%director%' /* English, Spanish */ or
        (headline like '%directeur%' and country_code in ('FR', 'NL')) /* French, Dutch */ or
        (headline like '%direttore%' and country_code = 'IT') /* Italian */ or
        /* 'DE' added: the term is documented as German/Swedish but was gated on NL/SE only */
        (headline like '%direkt%r%' and country_code in ('DE', 'NL', 'SE')) /* German, Swedish */ or
        (headline like '%diretor%' and country_code in ('BR', 'PT')) /* Portuguese */ or
        headline like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
        headline like '%manager%' /* English, French, German, Italian, Dutch */ or
        (headline like '%responsabile%' and country_code = 'IT') /* Italian */ or
        (headline like '%ledare%' and country_code = 'SE') /* Swedish */ or
        (headline like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
        headline like '%gerente%' /* Portuguese, Spanish */ or
        headline like '%principal%' or
        headline like '%senior%' or
        (headline like '%sr %' and headline not like '%sr base%' and headline not like '%sr. base%') or
        (headline like '%sr. %' and headline not like '%sr. base%') or
        headline like '%lead %' or
        headline like '%lead,%' or
        headline like '%head %' or
        headline like '%head,%' or
        (headline like '%hoofd%' and country_code = 'NL') /* Dutch */ or
        (headline like '%ba%kan%' and country_code = 'TR') /* Turkish */ or
        /* ---- title ---- */
        title like '%director%' /* English, Spanish */ or
        (title like '%directeur%' and country_code in ('FR', 'NL')) /* French, Dutch */ or
        (title like '%direttore%' and country_code = 'IT') /* Italian */ or
        (title like '%direkt%r%' and country_code in ('DE', 'NL', 'SE')) /* German, Swedish */ or
        (title like '%diretor%' and country_code in ('BR', 'PT')) /* Portuguese */ or
        title like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
        title like '%manager%' /* English, French, German, Italian, Dutch */ or
        (title like '%responsabile%' and country_code = 'IT') /* Italian */ or
        (title like '%ledare%' and country_code = 'SE') /* Swedish */ or
        (title like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
        title like '%gerente%' /* Portuguese, Spanish */ or
        title like '%principal%' or
        title like '%senior%' or
        (title like '%sr %' and title not like '%sr base%' and title not like '%sr. base%') or
        (title like '%sr. %' and title not like '%sr. base%') or
        title like '%lead %' or
        title like '%lead,%' or
        title like '%head %' or
        title like '%head,%' or
        (title like '%hoofd%' and country_code = 'NL') /* Dutch */ or
        (title like '%ba%kan%' and country_code = 'TR') /* Turkish */
    )
    and
    (
        (
            headline like '%data science%' and
            /* a NULL company_name must not silently drop the row */
            (company_name is null or lower(company_name) not like '%data science%') and
            headline not like '% at %data%science%'
        ) /* English, Dutch */ or
        headline like '%ciencia de datos%' /* Spanish */ or
        headline like '%science des donn%es%' /* French */ or
        headline like '%daten%wissenschaft%' /* German */ or
        headline like '%ci%ncia dados%' /* Portuguese */ or
        headline like '%scienza dati%' /* Italian */ or
        headline like '%veri bilimi%' /* Turkish */ or
        title like '%data science%' /* English, Dutch */ or
        title like '%ciencia de datos%' /* Spanish */ or
        title like '%science des donn%es%' /* French */ or
        title like '%daten%wissenschaft%' /* German */ or
        title like '%ci%ncia dados%' /* Portuguese */ or
        title like '%scienza dati%' /* Italian */ or
        title like '%veri bilimi%' /* Turkish */
    )
)
or
/*
Titles that qualify on their own, without a separate seniority word.
Each phrase is accepted when it appears in either the headline or the title.
*/
/*
Explicit Chief Data Scientist titles
*/
headline like '%chief data%scientist%' or title like '%chief data%scientist%' /* English, Dutch */ or
headline like '%jefe cient%fico de datos%' or title like '%jefe cient%fico de datos%' /* Spanish */ or
headline like '%scientifique%chef de donn%es%' or title like '%scientifique%chef de donn%es%' /* French */ or
headline like '%chef%daten%wissenschaftler%' or title like '%chef%daten%wissenschaftler%' /* German */ or
headline like '%cientista%chefe dados%' or title like '%cientista%chefe dados%' /* Portuguese */ or
headline like '%scienziato%dati capo%' or title like '%scienziato%dati capo%' /* Italian */ or
headline like '%ba%veri bilimci%' or title like '%ba%veri bilimci%' /* Turkish */ or
/*
Explicit Chief Data Officer titles
*/
headline like '%chief data%officer%' or title like '%chief data%officer%' /* English, Dutch, German, French */ or
headline like '%director de los datos%' or title like '%director de los datos%' /* Spanish */ or
headline like '%directeur des donn%es%' or title like '%directeur des donn%es%' /* French */ or
(headline like '%direttore dati%' and headline not like '%foundation%') /* Italian */ or
(title like '%direttore dati%' and title not like '%foundation%') /* Italian */ or
headline like '%de dados principal%' or title like '%de dados principal%' /* Portuguese */ or
/*
Plain Data Scientists
*/
headline like '%data scientist%' or title like '%data scientist%' /* English, Dutch */ or
headline like '%cient%fico de datos%' or title like '%cient%fico de datos%' /* Spanish */ or
headline like '%scientifique de donn%es%' or title like '%scientifique de donn%es%' /* French */ or
headline like '%daten%wis%enschaftler%' or title like '%daten%wis%enschaftler%' /* German */ or
headline like '%cientista de dados%' or title like '%cientista de dados%' /* Portuguese */ or
headline like '%scienziato dati%' or title like '%scienziato dati%' /* Italian */ or
headline like '%veri bilimci%' or title like '%veri bilimci%' /* Turkish */
)
and
(
    /*
    Exclusion filter: a profile that passed the inclusion rules is still
    dropped when its headline or title contains any phrase listed here.
    A NULL headline/title contains none of them, so it passes; this is written
    once per column as "col is null or (...)" instead of once per phrase.

    Fixes relative to the previous version: the list no longer has a missing
    "and" after the incubator block nor a dangling "and" before the closing
    parenthesis (both were syntax errors), and the French exceptions that
    were listed twice now appear once.
    */
    (
        headline is null or
        (
            /* Chief DS and CDO exceptions */
            headline not like '%office%of%chief%data%' and
            headline not like '%coordonnat%' and
            headline not like '%bases de donn%' and
            headline not like '%scientifiques et donn%es%' and
            headline not like '%scientifique sp%cialis%' and
            headline not like '%r%dactrice scientifique%' and
            headline not like '%qualit% des donn%es%' and
            /* Exclude analysts listing data scientist titles */
            headline not like '%analyst%' /* English, Dutch, German, French */ and
            headline not like '%analist%' /* Spanish, Portuguese, Italian, Turkish */ and
            /* Exclude people listing DS incubators in their headline */
            headline not like '%insight data science%' and
            headline not like '%data incubator%' and
            headline not like '%metis%' and
            headline not like '%general assemb%' and
            /* Other exceptions */
            /* NOTE(review): '%hr%' also matches any word containing "hr"; confirm this breadth is intended */
            headline not like '%hr%' and
            headline not like '%recruiter%' and
            headline not like '%exec search%' and
            headline not like '%buyer%' and
            headline not like '%seller%' and
            headline not like '%account dev%' and
            headline not like '%student%' and
            headline not like '%leading%' and
            headline not like '%heading%' and
            headline not like '%data science major%'
        )
    )
    and
    (
        title is null or
        (
            /* Chief DS and CDO exceptions */
            /* NOTE(review): broader than the headline pattern '%office%of%chief%data%'; kept as written */
            title not like '%office%of%' and
            title not like '%coordonnat%' and
            title not like '%bases de donn%' and
            title not like '%scientifiques et donn%es%' and
            title not like '%scientifique sp%cialis%' and
            title not like '%r%dactrice scientifique%' and
            title not like '%qualit% des donn%es%' and
            /* Exclude analysts listing data scientist titles */
            title not like '%analyst%' /* English, Dutch, German, French */ and
            title not like '%analist%' /* Spanish, Portuguese, Italian, Turkish */ and
            /* Other exceptions */
            title not like '%hr%' and
            title not like '%recruiter%' and
            title not like '%exec search%' and
            title not like '%buyer%' and
            title not like '%seller%' and
            title not like '%account dev%' and
            title not like '%student%' and
            title not like '%leading%' and
            title not like '%heading%' and
            title not like '%data science major%'
        )
    )
)
)
);
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment