Skip to content

Commit b24b1e0

Browse files
committed
fix unicode problems
1 parent 5194268 commit b24b1e0

File tree

3 files changed, with 9 additions and 20 deletions.

3 files changed, with 9 additions and 20 deletions.

paramgenerator/generateparams.py

Lines changed: 5 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,7 @@ def registerHandler(self, handler, inputParams, header):
5050
self.inputs.append(inputParams)
5151

5252
def writeCSV(self):
53-
output = codecs.open(self.outputFile, "w", encoding="utf-8")
53+
output = codecs.open( self.outputFile, "w",encoding="utf-8")
5454

5555
if len(self.inputs) == 0:
5656
return
@@ -66,8 +66,7 @@ def writeCSV(self):
6666
handler = self.handlers[j]
6767
data = self.inputs[j][i]
6868
csvLine.append(handler(data))
69-
70-
output.write("|".join(csvLine))
69+
output.write('|'.join([s for s in csvLine]))
7170
output.write("\n")
7271
output.close()
7372

@@ -76,6 +75,7 @@ def handlePersonParam(person):
7675
#return {"PersonID": person, "PersonURI":(PERSON_PREFIX+str("%020d"%person))}
7776

7877
def handleTimeParam(timeParam):
78+
#print timeParam.year
7979
#print timeParam.year
8080
res = str(timegm(date(year=int(timeParam.year),
8181
month=int(timeParam.month), day=int(timeParam.day)).timetuple())*1000)
@@ -242,9 +242,8 @@ def main(argv=None):
242242
# nameParams.extend([nameParams[random.randint(0, oldlen-1)] for j in range(newlen-oldlen)])
243243
nameParams = []
244244
for person in selectedPersonParams[1]:
245-
nameParams.append(givenNames.getValue(person))
246-
247-
print nameParams
245+
n = givenNames.getValue(person)
246+
nameParams.append(n)
248247

249248
# serialize all the parameters as CSV
250249
csvWriters = {}

paramgenerator/readfactors.py

Lines changed: 3 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -45,7 +45,7 @@ class NameParameter:
4545
def __init__(self, persons=[]):
4646
self.values={}
4747
for p in persons:
48-
self.values[p] = ""
48+
self.values[p] = 0
4949

5050
def setValue(self, person, value):
5151
self.values[person] = value
@@ -73,7 +73,8 @@ def load(factorFiles, friendFiles):
7373
person = int(line[0])
7474
if not results.existParam(person):
7575
results.addNewParam(person)
76-
givenNames.setValue(person, line[1])
76+
name = line[1]
77+
givenNames.setValue(person, name)
7778
results.addValue(person, "f", int(line[2]))
7879
results.addValue(person, "p", int(line[3]))
7980
results.addValue(person, "pl", int(line[4]))
@@ -103,11 +104,6 @@ def load(factorFiles, friendFiles):
103104
line = f.readline()
104105
count = line[1+line.rfind(","):]
105106
name = line[:line.rfind(",")]
106-
try:
107-
name.decode('ascii')
108-
except UnicodeEncodeError:
109-
continue
110-
111107
if not name in tags:
112108
tags[name] = 0
113109
tags[name] += int(count)
@@ -116,11 +112,6 @@ def load(factorFiles, friendFiles):
116112
for i in range(nameCount):
117113
line = f.readline().split(",")
118114
name = line[0]
119-
try:
120-
name.decode('ascii')
121-
except UnicodeEncodeError:
122-
continue
123-
124115
if not name in names:
125116
names[name] = 0
126117
names[name] += int(line[1])

paramgenerator/timeparameters.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,6 @@
11
import sys
22
import getopt
33
import math
4-
import random
54
from readfactors import FactorCount
65
from operator import itemgetter
76
import itertools
@@ -68,7 +67,7 @@ def getTimeParamsWithMedian(factors, (medianFirstMonth, medianLastMonth, median)
6867
for values in factors:
6968
input = sorted(values,key=lambda myc: (myc.year, myc.month))
7069
currentMedian = getMedian(values,lambda myc: myc.count, True)
71-
if int(median) == 0 or int(currentMedian.count) == 0:
70+
if int(median) == 0 or int(currentMedian.count) == 0 or int(currentMedian.year) == 0:
7271
res.append(TimeParameter(START_YEAR,1,1,0))
7372
continue
7473
if currentMedian.count > median:

0 commit comments

Comments
 (0)