Skip to content

Instantly share code, notes, and snippets.

@rajacsp
Created January 13, 2022 03:05
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save rajacsp/2fe35a83980df4dc2c109fabcad9b66b to your computer and use it in GitHub Desktop.
Save rajacsp/2fe35a83980df4dc2c109fabcad9b66b to your computer and use it in GitHub Desktop.
import pandas as pd
import random
from faker import Faker
# Number of fake records generated per column by default.
COUNT = 1_000_000

# Shared Faker instance that generate_names() draws its values from.
faker = Faker()
def generate_names(count, type):
    """Build a list of ``count`` fake values using the module-level ``faker``.

    Args:
        count: Number of values to generate. Zero or a negative number
            yields an empty list.
        type: Kind of value to produce: ``'name'`` (``faker.name()``) or
            ``'address'`` (``faker.address()``). The parameter name shadows
            the builtin ``type`` but is kept so keyword callers keep working.

    Returns:
        A list with one generated value per iteration, in generation order.

    Raises:
        ValueError: If ``type`` is neither ``'name'`` nor ``'address'``.
    """
    # Validate before the loop: an unknown kind used to fail only on the
    # first iteration, with an UnboundLocalError on ``c_item``.
    if type not in ('name', 'address'):
        raise ValueError(
            f"unsupported type {type!r}; expected 'name' or 'address'"
        )

    item_list = []
    for i in range(count):
        c_item = faker.name() if type == 'name' else faker.address()
        # Progress trace: one line per generated item.
        print(f'[{i}] : {c_item}')
        item_list.append(c_item)
    return item_list
def generate_data(count=None):
    """Assemble a DataFrame of fake usernames and addresses.

    Args:
        count: Number of rows to generate. When omitted or ``None`` the
            module-level ``COUNT`` is used (looked up at call time).

    Returns:
        A ``pandas.DataFrame`` with two columns, ``'username'`` and
        ``'address'``, each filled by a separate ``generate_names`` call.
    """
    if count is None:
        count = COUNT

    # The former ``global faker`` declaration was dropped: this function
    # never rebinds ``faker``, so the statement had no effect.
    username_list = generate_names(count, 'name')
    address_list = generate_names(count, 'address')

    return pd.DataFrame({
        'username': username_list,
        'address': address_list,
    })
def startpy(output_path='/Users/abc/datasets/user-1m.csv'):
    """Generate the fake dataset, print it, and save it as a CSV file.

    Args:
        output_path: Destination CSV file. Defaults to the location this
            script originally hard-coded.

    Raises:
        FileNotFoundError: If the directory that should contain
            ``output_path`` does not exist.
    """
    from pathlib import Path

    # Check the destination first: generating the data is the slow part, so
    # a missing directory should be reported before that work is done
    # rather than when the file is finally written.
    target_dir = Path(output_path).parent
    if not target_dir.is_dir():
        raise FileNotFoundError(
            f'output directory does not exist: {target_dir}'
        )

    data = generate_data()
    print(data)
    # to_csv is called with its defaults, as before, so the DataFrame index
    # is written alongside the two data columns.
    data.to_csv(output_path)
# Run the generator only when this file is executed as a script; importing
# it as a module does not trigger generation.
if __name__ == '__main__':
    startpy()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment