cleanup code

This commit is contained in:
tqchen
2014-05-15 15:01:41 -07:00
parent 3960ac9cb4
commit 37e1473cea
3 changed files with 15 additions and 28 deletions

View File

@@ -6,20 +6,22 @@ def save_data(group_data,output_feature,output_group):
output_group.write(str(len(group_data))+"\n")
for data in group_data:
output_feature.write(data[0] + " " + " ".join(data[2:]) + "\n")
# only include nonzero features
feats = [ p for p in data[2:] if float(p.split(':')[1]) != 0.0 ]
output_feature.write(data[0] + " " + " ".join(feats) + "\n")
if __name__ == "__main__":
if len(sys.argv) != 4:
print "Usage: python trans_data.py [Ranksvm Format Input] [Output Feature File] [Output Group File]"
sys.exit(0)
input = open(sys.argv[1])
fi = open(sys.argv[1])
output_feature = open(sys.argv[2],"w")
output_group = open(sys.argv[3],"w")
group_data = []
group = ""
for line in input:
for line in fi:
if not line:
break
if "#" in line:
@@ -33,8 +35,7 @@ if __name__ == "__main__":
save_data(group_data,output_feature,output_group)
input.close()
fi.close()
output_feature.close()
output_group.close()