summaryrefslogblamecommitdiff
path: root/aligncsv.py
blob: ce63a98866ba95bfe98d7fd3939147ccab19a9c2 (plain) (tree)
1
2
3
4
5
6
7
8





                                                                  

                    














                                                
 












                                                     
                                                                                 




                                                                                     

                                                                                   








                                                              
 
                                  
                                                                           
                                                                        



                                                                                    
                             
                                                                                            

















                                                                                  
#!/usr/bin/python
# Reformat a CSV file so that its columns line up, padding fields with tabs or spaces.

import os
import sys

tabs = True  # True: pad fields with tab characters; False: right-align with spaces
additionalspaces = 5  # extra left padding added to every field when tabs is False

TAB_WIDTH = 8  # tab-stop spacing assumed when padding with tab characters


def _split_fields(line):
    """Split *line* on commas and strip whitespace (newline included) from each field."""
    return [field.strip() for field in line.split(",")]


def _column_widths(rows, use_tabs):
    """Return the width of each column, counting one extra character for the comma.

    With *use_tabs* every width is rounded up to a multiple of TAB_WIDTH so
    that each column starts on a tab stop.
    """
    column_count = max([len(row) for row in rows] or [0])
    widths = [0] * column_count
    for row in rows:
        for index, field in enumerate(row):
            widths[index] = max(widths[index], len(field) + 1)
    if use_tabs:
        widths = [((width + TAB_WIDTH - 1) // TAB_WIDTH) * TAB_WIDTH
                  for width in widths]
    return widths


def align_lines(lines, use_tabs=None, extra_spaces=None):
    """Return the comma-separated *lines* re-rendered with aligned columns.

    lines        -- iterable of raw text lines (trailing newlines are allowed).
    use_tabs     -- pad after each field with tabs when true, otherwise
                    right-align each field with spaces; defaults to the
                    module-level ``tabs`` setting.
    extra_spaces -- additional left padding per field in space mode; defaults
                    to the module-level ``additionalspaces`` setting.

    The result holds one string per input line, without a trailing newline.
    Every field except the last one on its line keeps its comma. Rows with
    fewer fields than the widest row simply end early.
    """
    if use_tabs is None:
        use_tabs = tabs
    if extra_spaces is None:
        extra_spaces = additionalspaces

    rows = [_split_fields(line) for line in lines]
    widths = _column_widths(rows, use_tabs)

    aligned = []
    for row in rows:
        last = len(row) - 1
        cells = []
        for index, field in enumerate(row):
            text = field if index == last else field + ","
            gap = widths[index] - len(text)
            if use_tabs:
                # One tab per started tab stop between the text end and the
                # column boundary; floor division keeps the count an integer.
                cells.append(text + "\t" * ((gap + TAB_WIDTH - 1) // TAB_WIDTH))
            else:
                cells.append(" " * (gap + extra_spaces) + text)
        aligned.append("".join(cells))
    return aligned


def main(argv):
    """Align the CSV file argv[1] and write the result to argv[2].

    Returns the process exit status: 0 on success, 1 when the input file is
    missing, 2 when too few arguments were given.
    """
    if len(argv) < 3:
        sys.stderr.write("usage: %s INPUT OUTPUT\n" % argv[0])
        return 2

    source, destination = argv[1], argv[2]
    if not os.path.exists(source):
        sys.stderr.write("that file doesn't exist\n")
        return 1

    # The input is read completely before the output is opened, so the same
    # path may be given for both.
    with open(source, "r") as handle:
        lines = handle.readlines()

    aligned = align_lines(lines)
    column_count = max([len(line.split(",")) for line in lines] or [0])
    print("# number of entries = %d" % column_count)

    # The output file is created when it does not exist yet.
    with open(destination, "w") as handle:
        handle.writelines(row + "\n" for row in aligned)
    return 0


if __name__ == "__main__":
    sys.exit(main(sys.argv))