Created
January 13, 2022 03:05
-
-
Save rajacsp/2fe35a83980df4dc2c109fabcad9b66b to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import random

import pandas as pd
from faker import Faker

# Shared Faker instance used by the generator functions in this module.
faker = Faker()

# Default number of values generated per column.
COUNT = 1_000_000
def generate_names(count, type):
    """Build a list of ``count`` fake values of the requested kind.

    Args:
        count: Number of values to generate. Zero or a negative number
            yields an empty list.
        type: Kind of value to produce, either ``'name'`` or ``'address'``.
            The parameter name shadows the builtin, but it is kept so that
            existing keyword callers continue to work.

    Returns:
        A list holding the values returned by ``faker.name()`` or
        ``faker.address()``, in generation order.

    Raises:
        ValueError: If ``type`` is not one of the supported kinds.
    """
    # Reject unknown kinds up front: they used to match neither branch and
    # then fail on an unbound ``c_item`` during the first iteration.
    if type not in ('name', 'address'):
        raise ValueError(
            f"unsupported type {type!r}; expected 'name' or 'address'"
        )

    item_list = []
    for i in range(count):
        c_item = faker.name() if type == 'name' else faker.address()
        # Progress trace: one line per generated value.
        print(f'[{i}] : {c_item}')
        item_list.append(c_item)
    return item_list
def generate_data(count=None):
    """Assemble a DataFrame of fake usernames and addresses.

    Args:
        count: Number of rows to generate. ``None`` (the default) uses the
            module-level ``COUNT``, which matches the previous behaviour.

    Returns:
        A ``pandas.DataFrame`` with the columns ``username`` and ``address``.
    """
    # Resolve the default at call time so a changed COUNT is honoured.
    row_count = COUNT if count is None else count
    username_list = generate_names(row_count, 'name')
    address_list = generate_names(row_count, 'address')
    return pd.DataFrame({
        'username': username_list,
        'address': address_list,
    })
def startpy(output_path='/Users/abc/datasets/user-1m.csv'):
    """Generate the dataset, print it, and write it to a CSV file.

    Args:
        output_path: Destination handed to ``DataFrame.to_csv``. Defaults to
            the path that was previously hard-coded, so existing callers
            are unaffected.
    """
    data = generate_data()
    print(data)
    data.to_csv(output_path)
# Run the generator only when this file is executed as a script.
if __name__ == "__main__":
    startpy()
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment