Paritosh Kulkarni paritoshk

## gist:129171eb5fed7a40ddd998a69f87cf74
"""
Tech Company Information Extractor

This script extracts information about technology companies from a large text corpus
using the Fireworks AI API. It processes the input in chunks, extracts structured data
based on a predefined schema, and saves the results in multiple formats.

Requirements:
- Python 3.7+
- requests

## barplotfunctions.py
def makelist_ofallstrings(pdrow):
    """Flatten comma-separated entries of ``pdrow`` into a string-typed Series.

    Each entry ``pdrow[0] .. pdrow[len(pdrow) - 1]`` is split on commas and
    every resulting piece has its surrounding whitespace stripped.

    NOTE(review): the visible snippet builds ``df_temp`` and then ends without
    returning it, so the function currently returns ``None``. The listing looks
    truncated -- confirm against the full source.
    """
    # Entries are fetched by integer key, exactly as the index-based loop did.
    temp_list = [
        piece.strip()
        for position in range(len(pdrow))
        for piece in pdrow[position].split(sep=',')
    ]
    df_temp = pd.Series(temp_list).astype(str)

## feature.py
"""
df_order1 = pd.read_excel(r'visit_orders_jan_thru_may2018.xlsx')
df_order2 = pd.read_excel(r'visit_orders_JUN_thru_DEC2018.xlsx')

df_order_total = pd.concat([df_order1,df_order2])

df_order_total.info

df_order_total.shape
"""

## none_type_go.py
def nonetype_remove(pdrow):
    """Return the truthy items of ``pdrow`` as a list, in their original order.

    Despite the name, every falsy value is dropped -- ``None``, ``''``, ``0``,
    empty containers -- not only ``None``.
    """
    # filter(None, ...) keeps exactly the items whose truth value is True.
    return list(filter(None, pdrow))


## basic_clean.py
def basic_clean(text):
    """"
      A simple function to clean up the data. All the words that
      are not designated as a stop word is then lemmatized after
      encoding and basic regex parsing are performed.
      """
    wnl = nltk.stem.WordNetLemmatizer()
    stopwords = nltk.corpus.stopwords.words('english')
    text = (unicodedata.normalize('NFKD', text)
    .encode('ascii', 'ignore')

## clean_capitalize.py
def basic_cleanandcaptialize(lisofstrings):
    """Clean and title-case every string in ``lisofstrings``.

    Each input string is passed through ``basic_clean``; the tokens it yields
    are joined with single spaces and the joined text is title-cased.

    Returns a new list with one cleaned string per input string.
    """
    return [
        " ".join(basic_clean(raw_text)).title()
        for raw_text in lisofstrings
    ]

## Algo_Tag.py
# Store the raw input as a new column; every cell is then replaced in place by
# a list of cleaned, title-cased strings.
# NOTE(review): `df1` and `data` are defined outside this snippet -- presumably
# a DataFrame and a sequence of comma-separated strings; confirm with the caller.
df1['Data_total_grams'] = data
#words_indices_dataframe = pd.DataFrame()
for j in range(len(df1['Data_total_grams'])):
    # Split the cell on commas, then clean/title-case each piece.
    # NOTE(review): `df1[col][j] = ...` is chained-indexing assignment, which
    # pandas documents as not guaranteed to write through to `df1` -- consider
    # a single-step setter such as `df1.at[j, col]`; verify before changing.
    df1['Data_total_grams'][j] = df1['Data_total_grams'][j].split(sep=',')
    df1['Data_total_grams'][j] = basic_cleanandcaptialize(df1['Data_total_grams'][j])
    for p in range(len(df1['Data_total_grams'][j])):
        #print(len(list_of_strings[p].strip()))

        # Break the p-th cleaned entry into its whitespace-separated words.
        q = (df1['Data_total_grams'][j][p].strip()).split()


## UX-&-UI-Design-Resources.md

      
              1 file
            
          
              0 forks
            
          
                0 comments
              
            
              0 stars
            
          
                paritoshk
                / UX-&-UI-Design-Resources.md
            
            
              Created
              June 18, 2020 08:51
                — forked from teybannerman/UX-&-UI-Design-Resources.md
            
              
                UX & UI Design Resources
              
          
    UX & UI Design Resources on the Web

Index


Online Prototyping
User Testing & Feedback
UI Design Patterns
Colours & Gradients
User & Profile Photos
Stock Photography
Icons
	"""
	Tech Company Information Extractor

	This script extracts information about technology companies from a large text corpus
	using the Fireworks AI API. It processes the input in chunks, extracts structured data
	based on a predefined schema, and saves the results in multiple formats.

	Requirements:
	- Python 3.7+
	- requests
	def makelist_ofallstrings(pdrow):
		"""Flatten comma-separated entries of ``pdrow`` into a string-typed Series.

		Each entry ``pdrow[0] .. pdrow[len(pdrow) - 1]`` is split on commas and
		every resulting piece has its surrounding whitespace stripped.

		NOTE(review): the visible snippet builds ``df_temp`` and then ends
		without returning it, so the function returns ``None``. The listing
		looks truncated -- confirm against the full source.
		"""
		# Block structure restored: the flattened paste had lost the indentation
		# of the function body and of both loops.
		temp_list = []
		for i in range(len(pdrow)):
			list_sep = (pdrow[i]).split(sep=',')
			for j in list_sep:
				temp_list.append(j)
		temp_list = [x.strip() for x in temp_list]
		df_temp = pd.Series(temp_list)
		df_temp = df_temp.astype(str)
	"""
	df_order1 = pd.read_excel(r'visit_orders_jan_thru_may2018.xlsx')
	df_order2 = pd.read_excel(r'visit_orders_JUN_thru_DEC2018.xlsx')

	df_order_total = pd.concat([df_order1,df_order2])

	df_order_total.info

	df_order_total.shape
	"""
	def nonetype_remove(pdrow):
		"""Return the truthy items of ``pdrow`` as a list, in their original order.

		Despite the name, every falsy value is dropped -- ``None``, ``''``, ``0``,
		empty containers -- not only ``None``.
		"""
		# Body indentation restored; the flattened paste was not valid Python.
		return [item for item in pdrow if item]
	def basic_clean(text):
	""""
	A simple function to clean up the data. All the words that
	are not designated as a stop word is then lemmatized after
	encoding and basic regex parsing are performed.
	"""
	wnl = nltk.stem.WordNetLemmatizer()
	stopwords = nltk.corpus.stopwords.words('english')
	text = (unicodedata.normalize('NFKD', text)
	.encode('ascii', 'ignore')
	def basic_cleanandcaptialize(lisofstrings):
		"""Clean and title-case every string in ``lisofstrings``.

		Each input string is passed through ``basic_clean``; the tokens it yields
		are joined with single spaces and the joined text is title-cased.

		Returns a new list with one cleaned string per input string.
		"""
		# Body indentation restored; the flattened paste was not valid Python.
		return [
			" ".join(basic_clean(raw_text)).title()
			for raw_text in lisofstrings
		]
	# Store the raw input as a new column; every cell is then replaced in place
	# by a list of cleaned, title-cased strings. Loop nesting is restored here:
	# the flattened paste had lost the indentation of both loop bodies.
	# NOTE(review): `df1` and `data` are defined outside this snippet --
	# presumably a DataFrame and a sequence of comma-separated strings; confirm.
	df1['Data_total_grams'] = data
	#words_indices_dataframe = pd.DataFrame()
	for j in range(len(df1['Data_total_grams'])):
		# Split the cell on commas, then clean/title-case each piece.
		# NOTE(review): `df1[col][j] = ...` is chained-indexing assignment, which
		# pandas documents as not guaranteed to write through to `df1` --
		# consider `df1.at[j, col]`; verify before changing.
		df1['Data_total_grams'][j] = df1['Data_total_grams'][j].split(sep=',')
		df1['Data_total_grams'][j] = basic_cleanandcaptialize(df1['Data_total_grams'][j])
		for p in range(len(df1['Data_total_grams'][j])):
			#print(len(list_of_strings[p].strip()))

			# Break the p-th cleaned entry into its whitespace-separated words.
			q = (df1['Data_total_grams'][j][p].strip()).split()