Skip to content

Instantly share code, notes, and snippets.

View khaledadrani's full-sized avatar
Doing stuff

Khaled Adrani khaledadrani

Doing stuff
View GitHub Profile
import os
from dotenv import load_dotenv
import requests
#load your credentials through the .env file
def create_headers():
api_key = os.getenv('api_key')
import spacy
import re
# Load the trained NER pipeline from disk. A raw string keeps the backslash
# literal: '\m' is an invalid escape sequence that newer Python versions warn
# about. The resulting path value is unchanged.
ner = spacy.load(r'trf_ner\model-best')
def test_model():
Check if the model is loaded properly
from fastapi import FastAPI
from pydantic import BaseModel
from utils.nlp import extract_ents
from utils.twitter_api import get_response
app = FastAPI()
class Query(BaseModel):
keyword: str
max_results: int
# Sample sentences to run through the loaded NER pipeline.
samples = [
    "Facebook has a price target of $ 20 for this quarter",
    "$ AAPL is gaining a new momentum",
]

# Print every entity found in each sample as "<label> <text>".
for doc in ner.pipe(samples):
    for ent in doc.ents:
        print(ent.label_, ent.text)
#convert raw sentences into lists of (token, '') tuples, i.e. each token paired with an empty label
def sents2tuples(sents):
    """Tokenize each sentence and pair every token with an empty string.

    Returns a list with one entry per input sentence; each entry is a list
    of ``(token, '')`` tuples built from ``word_tokenize(sentence)``.
    """
    return [
        [(tok, '') for tok in word_tokenize(sentence)]
        for sentence in sents
    ]
#with sents2tuples, preprocessing will work just fine with new text
def preprocess( texts):
# Evaluation of trained model
# Start remove 'O' labels
labels = list(crf.classes_)
print("trained labels :",labels)
# start prediction and calculate f-score
y_pred = crf.predict(X_test)
print (metrics.flat_f1_score(y_test, y_pred,
average='weighted', labels=labels,zero_division=True))
crf = sklearn_crfsuite.CRF(
), y_train)
# Utils functions to extract features
def word2features(sent, i):
word = sent[i][0]
#postag = sent[i][1]
features = {
'bias': 1.0,
'word.lower()': word.lower(),
'word[-3:]': word[-3:],
'word[-2:]': word[-2:],
def import_documents_set_iob(train_file_path):
with open(train_file_path, encoding="utf8") as f:
tokens_in_file = f.readlines()
# construct list of list train set format
new_train_set = []
for index_token,token in enumerate(tokens_in_file):
# detect new document
is_new_document = False
khaledadrani /
Created January 17, 2022 13:30
Mount Google Drive in Google Colab
from google.colab import drive