I'm fairly new to Python and am going to be parsing hundreds of thousands of names eventually. What I wanted to do was take individual CSV files, and create new CSV files with only the info I wanted. Then to take the whole lot and combine it into one big file.
This code does that, but I feel I have typed way too much of it.
import csv
csv1 = 'dictionary//first_names.csv'
csv2 = 'dictionary//last_names.csv'
csv3 = 'dictionary//last_name_prefixes.csv'
csv4 = 'dictionary//profanities.csv'
csv5 = 'dictionary//suffixs.csv'
csv6 = 'dictionary//titles.csv'
csv7 = 'dictionary//symbols.csv'
csv8 = 'dictionary//businesses.csv'
csv9 = 'dictionary//initials.csv'
csv10 = 'dictionary//numbers.csv'
csv11 = 'dictionary//removable.csv'
def cleanupCSVFiles(csvFile, uniqueName):
with open(csvFile) as csvfile:
reader = csv.reader(csvfile)
names = [line[0] for line in reader]
with open('MyOutput//'+uniqueName+'.csv', 'w') as f:
for name in names:
f.write('{0}\n'.format(name))
def mergeCSVFiles():
fout=open('MyOutput//AllCSVFiles.csv', 'a')
for num in range (1,11):
for line in open('MyOutput//csv'+str(num)+'.csv'):
fout.write(line)
fout.close()
cleanupCSVFiles(csv1, "csv1")
cleanupCSVFiles(csv2, "csv2")
cleanupCSVFiles(csv3, "csv3")
cleanupCSVFiles(csv4, "csv4")
cleanupCSVFiles(csv5, "csv5")
cleanupCSVFiles(csv6, "csv6")
cleanupCSVFiles(csv7, "csv7")
cleanupCSVFiles(csv8, "csv8")
cleanupCSVFiles(csv9, "csv9")
cleanupCSVFiles(csv10, "csv10")
cleanupCSVFiles(csv11, "csv11")
mergeCSVFiles()