Encoding fixes
This commit is contained in:
@@ -36,10 +36,10 @@ def load(saved_classifier_filename, train_data_filename):
|
|||||||
return joblib.load(saved_classifier_filename)
|
return joblib.load(saved_classifier_filename)
|
||||||
except ValueError:
|
except ValueError:
|
||||||
import sys
|
import sys
|
||||||
pickle_options = {}
|
kwargs = {}
|
||||||
if sys.version_info > (3, 0):
|
if sys.version_info > (3, 0):
|
||||||
pickle_options["encoding"] = "bytes"
|
kwargs["encoding"] = "latin1"
|
||||||
|
|
||||||
loaded = pickle.load(open(saved_classifier_filename, 'rb'), **pickle_options)
|
loaded = pickle.load(open(saved_classifier_filename, 'rb'), **kwargs)
|
||||||
joblib.dump(loaded, saved_classifier_filename, compress=True)
|
joblib.dump(loaded, saved_classifier_filename, compress=True)
|
||||||
return loaded
|
return joblib.load(saved_classifier_filename)
|
||||||
|
|||||||
@@ -61,7 +61,7 @@ def parse_msg_sender(filename, sender_known=True):
|
|||||||
import sys
|
import sys
|
||||||
kwargs = {}
|
kwargs = {}
|
||||||
if sys.version_info > (3, 0):
|
if sys.version_info > (3, 0):
|
||||||
kwargs["encoding"] = "bytes"
|
kwargs["encoding"] = "utf8"
|
||||||
|
|
||||||
sender, msg = None, None
|
sender, msg = None, None
|
||||||
if os.path.isfile(filename) and not is_sender_filename(filename):
|
if os.path.isfile(filename) and not is_sender_filename(filename):
|
||||||
|
|||||||
@@ -306,7 +306,7 @@ def extract_reply_and_check(filename):
|
|||||||
import sys
|
import sys
|
||||||
kwargs = {}
|
kwargs = {}
|
||||||
if sys.version_info > (3, 0):
|
if sys.version_info > (3, 0):
|
||||||
kwargs["encoding"] = "bytes"
|
kwargs["encoding"] = "utf8"
|
||||||
|
|
||||||
f = open(filename, **kwargs)
|
f = open(filename, **kwargs)
|
||||||
|
|
||||||
|
|||||||
@@ -27,7 +27,7 @@ def test_messages_longer_SIGNATURE_MAX_LINES():
|
|||||||
import sys
|
import sys
|
||||||
kwargs = {}
|
kwargs = {}
|
||||||
if sys.version_info > (3, 0):
|
if sys.version_info > (3, 0):
|
||||||
kwargs["encoding"] = "bytes"
|
kwargs["encoding"] = "utf8"
|
||||||
|
|
||||||
for filename in os.listdir(STRIPPED):
|
for filename in os.listdir(STRIPPED):
|
||||||
filename = os.path.join(STRIPPED, filename)
|
filename = os.path.join(STRIPPED, filename)
|
||||||
|
|||||||
Reference in New Issue
Block a user