Skip to content

Instantly share code, notes, and snippets.

View tsh-code's full-sized avatar

TSH code sharing tsh-code

View GitHub Profile
Your task is to find unique individuals in the given text. As a result, return an array of objects in the given format:
[
{
firstName: string,
lastName: string,
presumedGender: "male" | "female" | "unknown"
}
]
{
"model":"gpt-4",
"messages":[
{
"role":"system",
"content":"Your task is to find unique individuals in the given text. As a result return an array of objects in given format: [{firstName: string, lastName: string, presumedGender: 'male' | 'female' | 'unknown'}] As an answer I expect only an array of objects."
},
{
"role":"user",
"content":"${textGoesHere}"
[
{
"firstName":"Lisa",
"lastName":"Turner",
"presumedGender":"female"
},
{
"firstName":"Mark",
"lastName":"Davis",
"presumedGender":"male"
@tsh-code
tsh-code / compromise-response-2.json
Last active April 4, 2024 10:17
compromise response 2
[
{
"text": "Lisa Turner",
"person": {
"firstName": "lisa",
"lastName": "turner",
"honorific": "",
"presumed_gender": "female"
}
},
@tsh-code
tsh-code / compromise-response-1.json
Last active April 4, 2024 10:18
compromise response 1
[
{
"text": "Lisa Turner, Mark Davis",
"person": {
"firstName": "lisa turner",
"lastName": "mark davis",
"honorific": "",
"presumed_gender": "null"
}
}
from flask import Flask, request
from datasets import load_dataset, Dataset
import json
from nltk.tokenize import sent_tokenize, word_tokenize
nlp = spacy.load("en_core_web_trf")
nlp.add_pipe("span_marker",config={"model": "lxyuan/span-marker-bert-base-multilingual-cased-multinerd"})
app = Flask(__name__)
@tsh-code
tsh-code / spacy-spanmarker.py
Created March 4, 2024 08:26
spacy spanmarker example
import spacy
nlp = spacy.load("en_core_web_trf")
nlp.add_pipe("span_marker", config={"model": "lxyuan/span-marker-bert-base-multilingual-cased-multinerd"})
def extract_people(text: str):
entities = nlp(text)
full_names = set()
for entity in entities.ents:
@tsh-code
tsh-code / spanmarker.py
Created March 4, 2024 08:25
span marker example
from span_marker import SpanMarkerModel
modelPreTrained = SpanMarkerModel.from_pretrained("tomaarsen/span-marker-mbert-base-multinerd")
modelPreTrained.try_cuda()
def extract_people(text:str):
entities = modelPreTrained.predict(text)
full_names = set()
for entity in entities.ents:
if entity['label'] == 'PER':
# Check if the entity has both a first name and a last name
@tsh-code
tsh-code / spacy-flask.py
Created March 4, 2024 08:25
spacy flask example
from flask import Flask, request, jsonify
import spacy
app = Flask(__name__)
nlp = spacy.load("en_core_web_sm")
def extract_people(text: str):
entities = nlp(text)
full_names = set()
[
{
"text": "Lisa Turner",
"person": {
"firstName": "lisa",
"lastName": "turner",
"honorific": "",
"presumed_gender": "female"
}
},