Create a gist now

Instantly share code, notes, and snippets.

What would you like to do?
The query we used in the RJMetrics benchmark report "The State of Data Science" to identify data scientist profiles.
/*
Look for Data Scientists in the following 9 languages:
-- English
-- Spanish
-- French
-- German
-- Dutch
-- Swedish
-- Italian
-- Portuguese
-- Turkish
*/
drop table if exists linkedin_people.data_scientists_pid;

/*
Rebuild linkedin_people.data_scientists_pid from linkedin_people.all_employees_pid.

A source row is kept when its headline or title identifies a data scientist
(see the inclusion filter below) and it is not caught by one of the exclusion
rules (analysts, recruiters, students, incubator names, French false
positives, ...). Every kept row gets a derived "level" column.

Structure:
  1. The derived table "flagged" evaluates every keyword family exactly once
     and exposes it as a 0/1 flag. The same families drive both the row
     filter and the level classification, so they are defined in one place.
  2. The outer select filters on the flags, applies the exclusions and
     computes "level". The flags are not written to the target table.

Notes:
  - All patterns are lowercase and '%' stands in for accented characters.
    NOTE(review): this presumably relies on headline and title being stored
    lowercased (company_name is explicitly passed through lower()) -- confirm.
  - A flag is 0 when its predicate is false OR unknown (NULL headline/title/
    country_code). The flags are only combined with AND/OR below, so this
    selects exactly the rows a direct three-valued evaluation would.
*/
create table linkedin_people.data_scientists_pid distkey(li_person_id) as
(
select
    li_person_id, li_company_id, company_name, first_name, last_name, title, headline,
    /*
    Levels, evaluated in this order (first match wins):
    -- executive
    Chief DS, Chief Data Officer (not Digital Officer), CMO, COO,
    CEO, CTO, founder, co-founder, owner, SVP, VP, president
    -- senior
    director, manager, lead, head, senior data scientist, principal
    (unless the headline or title contains "academic")
    -- academic
    professor, lecturer
    -- questionable
    have words "hiring", "looking" in the headline or title
    -- junior
    everybody else
    */
    case
        when is_exec_keyword = 1 or is_chief_ds = 1 or is_cdo = 1 then 'executive'
        when is_senior_keyword = 1
            and (headline not like '%academic%' or headline is null)
            and (title not like '%academic%' or title is null) then 'senior'
        when is_academic_keyword = 1 then 'academic'
        when
        (
            headline like '%hiring%' or
            headline like '%looking%' or
            title like '%hiring%' or
            title like '%looking%'
        ) then 'questionable'
        else 'junior'
    end as level,
    location, country_code, raw_date_started, month_started, year_started, date_started,
    position_duration, person_industry, num_connections, date_last_visited, date_updated
from
(
    select
        li_person_id, li_company_id, company_name, first_name, last_name, title, headline,
        location, country_code, raw_date_started, month_started, year_started, date_started,
        position_duration, person_industry, num_connections, date_last_visited, date_updated,

        /*
        Executive keywords (C-level, president, founder, owner, VP).
        NOTE(review): the headline '%vp%' test excludes '%mvp%' but the title
        test does not -- kept as in the original; confirm whether intended.
        */
        case when
        (
            headline like '%chief%' or
            headline like '%president%' or
            headline like '%ceo%' or
            (headline like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
            (headline like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
            headline like '%director ejecutivo%' /* Spanish */ or
            headline like '%cmo%' or
            headline like 'coo %' or
            headline like '% coo' or
            headline like '% coo %' or
            headline like '%/coo' or
            (headline like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
            (headline like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
            (headline like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
            (headline like '%diretor de opera%es%' and country_code in ('BR', 'PT')) /* Portuguese */ or
            headline like '%director de operaciones%' /* Spanish */ or
            headline like 'cto %' /* English, German, Italian, Swedish */ or
            headline like '% cto' or
            headline like '% cto %' or
            headline like '%/cto' or
            (headline like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
            (headline like '%diretor de tecnologia%' and country_code in ('BR', 'PT')) /* Portuguese */ or
            (headline like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
            (headline like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
            headline like '%director tecnol%gico%' /* Spanish */ or
            (headline like '%founder%' and headline not like '%group%') /* English */ or
            (headline like '%fondateur%' and country_code = 'FR') /* French */ or
            (headline like '%gr%nder%' and country_code = 'DE') /* German */ or
            (headline like '%oprichter%' and country_code = 'NL') /* Dutch */ or
            (headline like '%fondatore%' and country_code = 'IT') /* Italian */ or
            (headline like '%grundare%' and country_code = 'SE') /* Swedish */ or
            (headline like '%kurucu%' and country_code = 'TR') /* Turkish */ or
            headline like '%fundador%' /* Portuguese, Spanish */ or
            headline like '%owner %' or
            headline like '% owner%' or
            headline like '%propri%ta%r%' /* French, Italian, Portuguese */ or
            (headline like '%inhaber%' and country_code = 'DE') /* German */ or
            (headline like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
            (headline like '%sahip%' and country_code = 'TR') /* Turkish */ or
            headline like '%propietario%' /* Spanish */ or
            (headline like '%vp%' and headline not like '%mvp%') or
            headline like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            (headline like '%vizepr%sident%' and country_code = 'DE') /* German */ or
            (headline like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */ or
            title like '%chief%' or
            title like '%vp%' or
            title like '%president%' or
            title like '%ceo%' or
            (title like '%amministratore delegato%' and country_code = 'IT') /* Italian */ or
            (title like '%verkst%llande direkt%r%' and country_code = 'SE') /* Swedish */ or
            title like '%director ejecutivo%' /* Spanish */ or
            title like '%cmo%' or
            title like 'coo %' or
            title like '% coo' or
            title like '% coo %' or
            title like '%/coo' or
            (title like '%pr%sident directeur g%n%ral%' and country_code = 'FR') /* French */ or
            (title like '%algemeen directeur%' and country_code = 'NL') /* Dutch */ or
            (title like '%ba% i%letme g%revlisi%' and country_code = 'TR') /* Turkish */ or
            (title like '%diretor de opera%es%' and country_code in ('BR', 'PT')) /* Portuguese */ or
            title like '%director de operaciones%' /* Spanish */ or
            title like 'cto %' /* English, German, Italian, Swedish */ or
            title like '% cto' or
            title like '% cto %' or
            title like '%/cto' or
            (title like '%directeur de la technologie%' and country_code = 'FR') /* French */ or
            (title like '%diretor de tecnologia%' and country_code in ('BR', 'PT')) /* Portuguese */ or
            (title like '%hoofd technologie%' and country_code = 'NL') /* Dutch */ or
            (title like '%teknolojiden sorumlu ba%kan%' and country_code = 'TR') /* Turkish */ or
            title like '%director tecnol%gico%' /* Spanish */ or
            (title like '%founder%' and title not like '%group%') /* English */ or
            (title like '%fondateur%' and country_code = 'FR') /* French */ or
            (title like '%gr%nder%' and country_code = 'DE') /* German */ or
            (title like '%oprichter%' and country_code = 'NL') /* Dutch */ or
            (title like '%fondatore%' and country_code = 'IT') /* Italian */ or
            (title like '%grundare%' and country_code = 'SE') /* Swedish */ or
            (title like '%kurucu%' and country_code = 'TR') /* Turkish */ or
            title like '%fundador%' /* Portuguese, Spanish */ or
            title like '%owner %' or
            title like '% owner%' or
            title like '%propri%ta%r%' /* French, Italian, Portuguese */ or
            (title like '%inhaber%' and country_code = 'DE') /* German */ or
            (title like '%eigenaar%' and country_code = 'NL') /* Dutch */ or
            (title like '%sahip%' and country_code = 'TR') /* Turkish */ or
            title like '%propietario%' /* Spanish */ or
            title like '%vice%president%' /* English, French, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            (title like '%vizepr%sident%' and country_code = 'DE') /* German */ or
            (title like '%ba%kan yard%mc%s%' and country_code = 'TR') /* Turkish */
        ) then 1 else 0 end as is_exec_keyword,

        /*
        Senior keywords (director, manager, principal, senior, lead, head).
        The 'direkt%r' test now includes 'DE': the original was labelled
        "German, Swedish" but only tested NL and SE, so German profiles could
        never match. NL is kept so previously matched rows still match.
        */
        case when
        (
            headline like '%director%' /* English, Spanish */ or
            (headline like '%directeur%' and country_code in ('FR', 'NL')) /* French, Dutch */ or
            (headline like '%direttore%' and country_code = 'IT') /* Italian */ or
            (headline like '%direkt%r%' and country_code in ('DE', 'NL', 'SE')) /* German, Swedish (NL kept) */ or
            (headline like '%diretor%' and country_code in ('BR', 'PT')) /* Portuguese */ or
            headline like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            headline like '%manager%' /* English, French, German, Italian, Dutch */ or
            (headline like '%responsabile%' and country_code = 'IT') /* Italian */ or
            (headline like '%ledare%' and country_code = 'SE') /* Swedish */ or
            (headline like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
            headline like '%gerente%' /* Portuguese, Spanish */ or
            headline like '%principal%' or
            headline like '%senior%' or
            (headline like '%sr %' and headline not like '%sr base%' and headline not like '%sr. base%') or
            (headline like '%sr. %' and headline not like '%sr. base%') or
            headline like '%lead %' or
            headline like '%lead,%' or
            headline like '%head %' or
            headline like '%head,%' or
            (headline like '%hoofd%' and country_code = 'NL') /* Dutch */ or
            (headline like '%ba%kan%' and country_code = 'TR') /* Turkish */ or
            title like '%director%' /* English, Spanish */ or
            (title like '%directeur%' and country_code in ('FR', 'NL')) /* French, Dutch */ or
            (title like '%direttore%' and country_code = 'IT') /* Italian */ or
            (title like '%direkt%r%' and country_code in ('DE', 'NL', 'SE')) /* German, Swedish (NL kept) */ or
            (title like '%diretor%' and country_code in ('BR', 'PT')) /* Portuguese */ or
            title like '%pr%sident%' /* English, French, German, Dutch, Italian, Swedish, Portuguese, Spanish */ or
            title like '%manager%' /* English, French, German, Italian, Dutch */ or
            (title like '%responsabile%' and country_code = 'IT') /* Italian */ or
            (title like '%ledare%' and country_code = 'SE') /* Swedish */ or
            (title like '%m%d%r%' and country_code = 'TR') /* Turkish */ or
            title like '%gerente%' /* Portuguese, Spanish */ or
            title like '%principal%' or
            title like '%senior%' or
            (title like '%sr %' and title not like '%sr base%' and title not like '%sr. base%') or
            (title like '%sr. %' and title not like '%sr. base%') or
            title like '%lead %' or
            title like '%lead,%' or
            title like '%head %' or
            title like '%head,%' or
            (title like '%hoofd%' and country_code = 'NL') /* Dutch */ or
            (title like '%ba%kan%' and country_code = 'TR') /* Turkish */
        ) then 1 else 0 end as is_senior_keyword,

        /* Academic keywords (professor, lecturer). */
        case when
        (
            headline like '%professor%' /* English, Dutch, German, Portuguese, Italian */ or
            headline like '%profesor%' /* Spanish */ or
            headline like '%professeur%' /* French */ or
            headline similar to '%profes_r%' /* Turkish */ or
            title like '%professor%' /* English, Dutch, German, Portuguese, Italian */ or
            title like '%profesor%' /* Spanish */ or
            title like '%professeur%' /* French */ or
            title similar to '%profes_r%' /* Turkish */ or
            headline like '%lecturer%' /* English */ or
            headline like '%lector%' /* Dutch */ or
            headline like '%charg%de cours%' /* French */ or
            headline like '%dozent%' /* German */ or
            headline like '%docente%' /* Italian */ or
            headline like '%okutman%' /* Turkish */ or
            title like '%lecturer%' /* English */ or
            title like '%lector%' /* Dutch */ or
            title like '%charg%de cours%' /* French */ or
            title like '%dozent%' /* German */ or
            title like '%docente%' /* Italian */ or
            title like '%okutman%' /* Turkish */
        ) then 1 else 0 end as is_academic_keyword,

        /* Explicit Chief Data Scientist titles. */
        case when
        (
            headline like '%chief data%scientist%' /* English, Dutch */ or
            headline like '%jefe cient%fico de datos%' /* Spanish */ or
            headline like '%scientifique%chef de donn%es%' /* French */ or
            headline like '%chef%daten%wissenschaftler%' /* German */ or
            headline like '%cientista%chefe dados%' /* Portuguese */ or
            headline like '%scienziato%dati capo%' /* Italian */ or
            headline like '%ba%veri bilimci%' /* Turkish */ or
            title like '%chief data%scientist%' /* English, Dutch */ or
            title like '%jefe cient%fico de datos%' /* Spanish */ or
            title like '%scientifique%chef de donn%es%' /* French */ or
            title like '%chef%daten%wissenschaftler%' /* German */ or
            title like '%cientista%chefe dados%' /* Portuguese */ or
            title like '%scienziato%dati capo%' /* Italian */ or
            title like '%ba%veri bilimci%' /* Turkish */
        ) then 1 else 0 end as is_chief_ds,

        /* Explicit Chief Data Officer titles. */
        case when
        (
            headline like '%chief data%officer%' /* English, Dutch, German, French */ or
            headline like '%director de los datos%' /* Spanish */ or
            headline like '%directeur des donn%es%' /* French */ or
            (headline like '%direttore dati%' and headline not like '%foundation%') /* Italian */ or
            headline like '%de dados principal%' /* Portuguese */ or
            title like '%chief data%officer%' /* English, Dutch, German, French */ or
            title like '%director de los datos%' /* Spanish */ or
            title like '%directeur des donn%es%' /* French */ or
            (title like '%direttore dati%' and title not like '%foundation%') /* Italian */ or
            title like '%de dados principal%' /* Portuguese */
        ) then 1 else 0 end as is_cdo,

        /* Plain "data scientist" in headline or title. */
        case when
        (
            headline like '%data scientist%' /* English, Dutch */ or
            headline like '%cient%fico de datos%' /* Spanish */ or
            headline like '%scientifique de donn%es%' /* French */ or
            headline like '%daten%wis%enschaftler%' /* German */ or
            headline like '%cientista de dados%' /* Portuguese */ or
            headline like '%scienziato dati%' /* Italian */ or
            headline like '%veri bilimci%' /* Turkish */ or
            title like '%data scientist%' /* English, Dutch */ or
            title like '%cient%fico de datos%' /* Spanish */ or
            title like '%scientifique de donn%es%' /* French */ or
            title like '%daten%wis%enschaftler%' /* German */ or
            title like '%cientista de dados%' /* Portuguese */ or
            title like '%scienziato dati%' /* Italian */ or
            title like '%veri bilimci%' /* Turkish */
        ) then 1 else 0 end as is_plain_ds,

        /* "Data science" mentioned anywhere in headline or title (used for academics). */
        case when
        (
            headline like '%data science%' /* English, Dutch */ or
            headline like '%ciencia de datos%' /* Spanish */ or
            headline like '%science des donn%es%' /* French */ or
            headline like '%daten%wissenschaft%' /* German */ or
            headline like '%ci%ncia dados%' /* Portuguese */ or
            headline like '%scienza dati%' /* Italian */ or
            headline like '%veri bilimi%' /* Turkish */ or
            title like '%data science%' /* English, Dutch */ or
            title like '%ciencia de datos%' /* Spanish */ or
            title like '%science des donn%es%' /* French */ or
            title like '%daten%wissenschaft%' /* German */ or
            title like '%ci%ncia dados%' /* Portuguese */ or
            title like '%scienza dati%' /* Italian */ or
            title like '%veri bilimi%' /* Turkish */
        ) then 1 else 0 end as mentions_ds_any,

        /*
        "Data science" mention used for executives and seniors. The English
        headline match is ignored when the phrase appears in the company name
        or after " at " in the headline. A NULL company_name makes that
        headline test unknown, so such rows can only qualify through one of
        the other patterns (same as the original).
        */
        case when
        (
            (
                headline like '%data science%' and
                lower(company_name) not like '%data science%' and
                headline not like '% at %data%science%'
            ) /* English, Dutch */ or
            headline like '%ciencia de datos%' /* Spanish */ or
            headline like '%science des donn%es%' /* French */ or
            headline like '%daten%wissenschaft%' /* German */ or
            headline like '%ci%ncia dados%' /* Portuguese */ or
            headline like '%scienza dati%' /* Italian */ or
            headline like '%veri bilimi%' /* Turkish */ or
            title like '%data science%' /* English, Dutch */ or
            title like '%ciencia de datos%' /* Spanish */ or
            title like '%science des donn%es%' /* French */ or
            title like '%daten%wissenschaft%' /* German */ or
            title like '%ci%ncia dados%' /* Portuguese */ or
            title like '%scienza dati%' /* Italian */ or
            title like '%veri bilimi%' /* Turkish */
        ) then 1 else 0 end as mentions_ds_strict
    from linkedin_people.all_employees_pid
) as flagged
where
(
    /* Lecturers and professors of data science */
    (is_academic_keyword = 1 and mentions_ds_any = 1) or
    /* Executive level working in data science */
    (is_exec_keyword = 1 and mentions_ds_strict = 1) or
    /* Senior level working in data science */
    (is_senior_keyword = 1 and mentions_ds_strict = 1) or
    /* Explicit Chief Data Scientist / Chief Data Officer titles */
    is_chief_ds = 1 or
    is_cdo = 1 or
    /* Plain data scientists */
    is_plain_ds = 1
)
and
(
    /*
    Chief DS and CDO exceptions, plus French false positives.
    NOTE(review): the title test '%office%of%' is broader than the headline
    test '%office%of%chief%data%' -- kept as in the original; confirm.
    */
    (headline not like '%office%of%chief%data%' or headline is null) and
    (headline not like '%coordonnat%' or headline is null) and
    (headline not like '%bases de donn%' or headline is null) and
    (headline not like '%scientifiques et donn%es%' or headline is null) and
    (headline not like '%scientifique sp%cialis%' or headline is null) and
    (headline not like '%r%dactrice scientifique%' or headline is null) and
    (headline not like '%qualit% des donn%es%' or headline is null) and
    (title not like '%office%of%' or title is null) and
    (title not like '%coordonnat%' or title is null) and
    (title not like '%bases de donn%' or title is null) and
    (title not like '%scientifiques et donn%es%' or title is null) and
    (title not like '%scientifique sp%cialis%' or title is null) and
    (title not like '%r%dactrice scientifique%' or title is null) and
    (title not like '%qualit% des donn%es%' or title is null) and
    /*
    Exclude analysts listing data scientist titles
    */
    (headline not like '%analyst%' or headline is null) /* English, Dutch, German, French */ and
    (headline not like '%analist%' or headline is null) /* Spanish, Portuguese, Italian, Turkish */ and
    (title not like '%analyst%' or title is null) /* English, Dutch, German, French */ and
    (title not like '%analist%' or title is null) /* Spanish, Portuguese, Italian, Turkish */ and
    /*
    Exclude people listing DS incubators in their headline
    */
    (headline not like '%insight data science%' or headline is null) and
    (headline not like '%data incubator%' or headline is null) and
    (headline not like '%metis%' or headline is null) and
    (headline not like '%general assemb%' or headline is null) and
    /*
    Other exceptions (recruiting, sales, students, "leading"/"heading" verbs).
    NOTE(review): '%hr%' also matches inside longer words -- kept as in the
    original; confirm that this breadth is intended.
    */
    (headline not like '%hr%' or headline is null) and
    (headline not like '%recruiter%' or headline is null) and
    (headline not like '%exec search%' or headline is null) and
    (headline not like '%buyer%' or headline is null) and
    (headline not like '%seller%' or headline is null) and
    (headline not like '%account dev%' or headline is null) and
    (headline not like '%student%' or headline is null) and
    (headline not like '%leading%' or headline is null) and
    (headline not like '%heading%' or headline is null) and
    (headline not like '%data science major%' or headline is null) and
    (title not like '%hr%' or title is null) and
    (title not like '%recruiter%' or title is null) and
    (title not like '%exec search%' or title is null) and
    (title not like '%buyer%' or title is null) and
    (title not like '%seller%' or title is null) and
    (title not like '%account dev%' or title is null) and
    (title not like '%student%' or title is null) and
    (title not like '%leading%' or title is null) and
    (title not like '%heading%' or title is null) and
    (title not like '%data science major%' or title is null)
)
);
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment